Permalink
Browse files

HTML table parsing requires UTF8 decoding

  • Loading branch information...
1 parent c07503c commit af4159582821caa23d4ba6d008ba08ead810c0a6 Chris Fields committed Feb 19, 2013
Showing 1 changed file with 2 additions and 1 deletion.
  1. +2 −1 Bio/DB/SeqVersion/gi.pm
@@ -102,6 +102,7 @@ methods. Internal methods are usually preceded with a _
package Bio::DB::SeqVersion::gi;
use strict;
+use Encode;
use HTML::TableExtract;
use base qw(Bio::DB::SeqVersion);
@@ -278,7 +279,7 @@ sub _process_data {
my $te = HTML::TableExtract->new(
headers => ['Gi', 'Version', 'Update Date'] ,
depth => 0);
- $te->parse($html);
+ $te->parse(decode_utf8($html));
my $table = $te->first_table_found;
$self->throw("No table found") unless defined $table;
my $t = [$table->rows];

0 comments on commit af41595

Please sign in to comment.