Add solutions to 018 by E. Choroba

There are two different files for the first task, one of them searches the longest common substring naively, the second one uses a suffix tree. The priority queue is also implemented in two different ways, but in one file only: using an array or a heap.
author: E. Choroba <choroba@matfyz.cz> 2019-07-26 00:20:01 +0200
committer: E. Choroba <choroba@matfyz.cz> 2019-07-26 00:20:01 +0200
commit: 4d1a5e75514d48d0dd0583d2e94e702ec4355361 (patch)
tree: cea57a4f2a7da5cd9b0174e13c3d30c589216cd5
parent: 7b0e5c1aed8203488c1745a12bf2eb79ef262dd4 (diff)
download: perlweeklychallenge-club-4d1a5e75514d48d0dd0583d2e94e702ec4355361.tar.gz
perlweeklychallenge-club-4d1a5e75514d48d0dd0583d2e94e702ec4355361.tar.bz2
perlweeklychallenge-club-4d1a5e75514d48d0dd0583d2e94e702ec4355361.zip
3 files changed, 296 insertions, 0 deletions
diff --git a/challenge-018/e-choroba/perl5/ch-1a.pl b/challenge-018/e-choroba/perl5/ch-1a.pl
new file mode 100755
index 0000000000..3bb93311c7
--- /dev/null
+++ b/challenge-018/e-choroba/perl5/ch-1a.pl
@@ -0,0 +1,24 @@
+#!/usr/bin/perl
+use warnings;
+use strict;
+use feature qw{ say };
+
+my @longest = ("");
+my $string  = shift;
+for my $pos (1 .. length $string) {
+    for my $length (1 .. 1 - $pos + length $string) {
+        next if $length < length $longest[0];
+
+        my $substr = substr $string, $pos - 1, $length;
+        my $found = 0;
+        -1 != index $_, $substr and ++$found for @ARGV;
+        if ($found == @ARGV) {
+            if ($length == length $longest[0]) {
+                push @longest, $substr;
+            } else {
+                @longest = $substr;
+            }
+        }
+    }
+}
+say "<$_>" for @longest;
diff --git a/challenge-018/e-choroba/perl5/ch-1b.pl b/challenge-018/e-choroba/perl5/ch-1b.pl
new file mode 100755
index 0000000000..fcbdfc0972
--- /dev/null
+++ b/challenge-018/e-choroba/perl5/ch-1b.pl
@@ -0,0 +1,181 @@
+#!/usr/bin/perl
+use warnings;
+use strict;
+use feature qw{ say };
+
+{   package My::Node;
+    sub new { bless { start => $_[1], end => $_[2] }, $_[0] }
+    sub edge_length {
+        my ($self, $position) = @_;
+        ($self->{end} < $position + 1
+            ? $self->{end}
+            : $position + 1
+        ) - $self->{start}
+    }
+}
+
+{   package My::Suffix::Tree;
+
+    sub new {
+        my ($class) = @_;
+        bless my $self = {position => -1,
+                          text => "",
+                          active_edge => 0,
+                          active_length => 0,
+                          current_node => -1,
+        }, $class;
+        $self->{root} = $self->new_node(-1, -1);
+        $self->{active_node} = $self->{root};
+        return $self
+    }
+
+    sub add_numbers {
+        my ($self, $node_index) = @_;
+        my $node = $self->{nodes}[$node_index];
+        for my $next_index (values %{ $node->{next} }) {
+            undef $node->{numbers}{$_} for $self->add_numbers($next_index);
+        }
+        return $node->{number} // () unless exists $node->{numbers};
+
+        return keys %{ $self->{numbers} }
+    }
+
+    sub add_words {
+        my ($self, @words) = @_;
+        $self->{number_of_words} = @ARGV;
+        for my $word_index (0 .. $#words) {
+            $self->add_char($_)
+                for split //, "$words[$word_index]<$word_index>";
+        }
+        my $text_length = length $self->{text};
+        for my $node (@{ $self->{nodes} }) {
+            next if $node->{start} < 0;
+            my $text = $node->{end} > $text_length
+                     ? substr $self->{text}, $node->{start}
+                     : substr $self->{text}, $node->{start},
+                           $node->{end} - $node->{start};
+            $node->{text} = $text;
+            if (my ($number) =  $text =~ /<([0-9]+)>/) {
+                $node->{number} = $number;
+            }
+        }
+        $self->add_numbers(0);
+    }
+
+    sub _add_suffix_link {
+        my ($self, $node) = @_;
+        $self->{nodes}[ $self->{need_suffix_link} ]{link} = $node
+            if $self->{need_suffix_link} > 0;
+        $self->{need_suffix_link} = $node;
+    }
+
+    sub active_edge { substr $_[0]{text}, $_[0]{active_edge}, 1 }
+
+    sub walk_down {
+        my ($self, $next) = @_;
+        $next //= 0;
+        my $position = $self->{position};
+        if ($self->{active_length}
+            >= $self->{nodes}[$next]->edge_length($position)
+        ) {
+            $self->{active_edge}
+                += $self->{nodes}[$next]->edge_length($position);
+            $self->{active_length}
+                -= $self->{nodes}[$next]->edge_length($position);
+            $self->{active_node} = $next;
+            return 1
+        }
+        return
+    }
+
+    sub new_node {
+        my ($self, $start, $end) = @_;
+        $self->{nodes}[ ++$self->{current_node} ]
+            = 'My::Node'->new($start, $end);
+        $self->{current_node}
+    }
+
+    sub add_char {
+        my ($self, $char) = @_;
+        substr $self->{text}, ++$self->{position}, 1, $char;
+        $self->{need_suffix_link} = -1;
+        ++$self->{remainder};
+        while ($self->{remainder} > 0) {
+            $self->{active_edge} = $self->{position}
+                unless $self->{active_length};
+            if (! exists
+                $self->{nodes}[ $self->{active_node} ]{next}{ $self->active_edge }
+            ) {
+                $self->{nodes}[ $self->{active_node} ]
+                    {next}{ $self->active_edge }
+                    = $self->new_node($self->{position}, 'INF');
+                $self->_add_suffix_link($self->{active_node});  # Rule 2.
+            } else {
+                my $next = $self->{nodes}[ $self->{active_node} ]
+                    {next}{ $self->active_edge };
+                next if $self->walk_down($next);  # Observation 2.
+
+                # Observation 2.
+                if ($char eq substr $self->{text},
+                        $self->{nodes}[$next]{start} + $self->{active_length}, 1
+                ) {
+                    ++$self->{active_length};
+                    $self->_add_suffix_link($self->{active_node});  # Observation 3.
+                    last
+                }
+                my $split = $self->new_node($self->{nodes}[$next]{start},
+                    $self->{nodes}[$next]{start} + $self->{active_length});
+                $self->{nodes}[ $self->{active_node} ]{next}
+                    { $self->active_edge } = $split;
+                my $leaf = $self->new_node($self->{position}, 'INF');
+                $self->{nodes}[$split]{next}{$char} = $leaf;
+                $self->{nodes}[$next]{start} += $self->{active_length};
+                $self->{nodes}[$split]{next}{ substr $self->{text},
+                    $self->{nodes}[$next]{start}, 1 } = $next;
+                $self->_add_suffix_link($split);  # Rule 2.
+            }
+            -- $self->{remainder};
+
+            if ($self->{active_node} == $self->{root}
+                && $self->{active_length} > 0  # Rule 1.
+            ) {
+                --$self->{active_length};
+                $self->{active_edge}
+                    = $self->{position} - $self->{remainder} + 1;
+            } else {
+                $self->{nodes}[ $self->{active_node} ]{link} //= 0;
+                $self->{active_node}
+                    = $self->{nodes}[ $self->{active_node} ]{link} > 0
+                    ? $self->{nodes}[ $self->{active_node} ]{link}
+                    : $self->{root};  # Rule 3.
+            }
+        }
+    }
+
+    my @lcs;
+    sub longest_common_substring {
+        my ($self, $node_index, $string) = @_;
+        @lcs = ("") unless $node_index;
+        my $node = $self->{nodes}[$node_index];
+
+        if ($self->{number_of_words} == keys %{ $node->{numbers} }) {
+            my $compare_lengths = length $string <=> length $lcs[0];
+            push @lcs, $string if $compare_lengths == 0;
+            @lcs = ($string) if $compare_lengths == 1;
+        }
+
+        for my $next_char (keys %{ $node->{next} }) {
+            my $next_index = $node->{next}{$next_char};
+            my $next = $self->{nodes}[$next_index];
+            $self->longest_common_substring(
+                $next_index,
+                "$string$next->{text}");
+        }
+        return @lcs
+    }
+}
+
+my $o = 'My::Suffix::Tree'->new;
+$o->add_words(@ARGV);
+
+say "<$_>" for $o->longest_common_substring(0, "");
diff --git a/challenge-018/e-choroba/perl5/ch-2.pl b/challenge-018/e-choroba/perl5/ch-2.pl
new file mode 100755
index 0000000000..79c11f00a0
--- /dev/null
+++ b/challenge-018/e-choroba/perl5/ch-2.pl
@@ -0,0 +1,91 @@
+#!/usr/bin/perl
+use warnings;
+use strict;
+
+{   package My::Queue::Priority::Array;
+
+    sub new { bless [], shift }
+
+    sub is_empty { ! grep @{ $_ // [] }, @{ $_[0] } }
+
+    sub insert_with_priority {
+        my ($self, $element, $priority) = @_;
+        push @{ $self->[$priority] }, $element;
+    }
+
+    sub pull_highest_priority_element {
+        my ($self) = @_;
+        my ($i) = grep @{ $self->[$_] || [] }, reverse 0 .. $#$self;
+        shift @{ $self->[$i] }
+    }
+}
+
+{   package My::Queue::Priority::Heap;
+    use enum qw( ELEMENT PRIORITY );
+
+    sub new { bless [], shift }
+
+    sub is_empty { ! @{ $_[0] } }
+
+    sub insert_with_priority {
+        my ($self, $element, $priority) = @_;
+        push @$self, [$element, $priority];
+        my $i = $#$self;
+        my $p = int(($i - 1) / 2);
+        while ($p >= 0 && $self->[$p][PRIORITY] < $self->[$i][PRIORITY]) {
+            @$self[$i, $p] = @$self[$p, $i];
+            $i = $p;
+            $p = int(($i - 1) / 2);
+        }
+    }
+
+    sub pull_highest_priority_element {
+        my ($self) = @_;
+        my $element = shift(@$self)->[ELEMENT];
+        my $new = ref($self)->new;
+        $new->insert_with_priority(@$_) for reverse @$self;
+        $_[0] = $new;
+        return $element
+    }
+}
+
+use Test::More tests => 2 * 14;
+
+for my $class (qw(My::Queue::Priority::Array My::Queue::Priority::Heap)) {
+    my $q = $class->new();
+    ok $q->is_empty;
+
+    $q->insert_with_priority(@$_)
+        for [a => 10], [b => 4], [c => 2], [d=>8], [e => 4], [f => 3];
+    ok ! $q->is_empty;
+
+    is $q->pull_highest_priority_element, 'a';
+    ok ! $q->is_empty;
+    is $q->pull_highest_priority_element, 'd';
+    ok ! $q->is_empty;
+    is $q->pull_highest_priority_element, 'b';
+    ok ! $q->is_empty;
+    is $q->pull_highest_priority_element, 'e';
+    ok ! $q->is_empty;
+    is $q->pull_highest_priority_element, 'f';
+    ok ! $q->is_empty;
+    is $q->pull_highest_priority_element, 'c';
+    ok $q->is_empty;
+}
+
+use Benchmark qw{ cmpthese };
+cmpthese(-3, {
+    heap => sub {
+        my $q = My::Queue::Priority::Heap->new;
+        $q->insert_with_priority(@$_)
+            for [a => 10], [b => 4], [c => 2], [d=>8], [e => 4], [f => 3];
+        $q->pull_highest_priority_element for 1 .. 6;
+    },
+    array => sub {
+        my $q = My::Queue::Priority::Array->new;
+        $q->insert_with_priority(@$_)
+            for [a => 10], [b => 4], [c => 2], [d=>8], [e => 4], [f => 3];
+        $q->pull_highest_priority_element for 1 .. 6;
+    }
+
+});
author	E. Choroba <choroba@matfyz.cz>	2019-07-26 00:20:01 +0200
committer	E. Choroba <choroba@matfyz.cz>	2019-07-26 00:20:01 +0200
commit	4d1a5e75514d48d0dd0583d2e94e702ec4355361 (patch)
tree	cea57a4f2a7da5cd9b0174e13c3d30c589216cd5
parent	7b0e5c1aed8203488c1745a12bf2eb79ef262dd4 (diff)
download	perlweeklychallenge-club-4d1a5e75514d48d0dd0583d2e94e702ec4355361.tar.gz perlweeklychallenge-club-4d1a5e75514d48d0dd0583d2e94e702ec4355361.tar.bz2 perlweeklychallenge-club-4d1a5e75514d48d0dd0583d2e94e702ec4355361.zip