Changeset 1607

Show
Ignore:
Timestamp:
08/27/06 15:28:57
Author:
miyagawa
Message:
  • Aggregator::Simple: support per-entry level language
  • Filter::GuessLanguage: fixed language accessor
  • Plagger::Util: Fixed plaintext() to decode utf8 before dumping to HTML
Files:

Legend:

Unmodified
Added
Removed
Modified
Copied
Moved
  • branches/hackathon-summary/plagger/lib/Plagger/Plugin/Aggregator/Simple.pm

    r1580 r1607  
    143143        $entry->summary($summary) if $summary; 
    144144 
     145        # per-entry level language support in Atom 
     146        if ($e->{entry}->content && $e->{entry}->content->lang) { 
     147            $entry->language($e->{entry}->content->lang); 
     148        } 
     149 
    145150        # enclosure support, to be added to XML::Feed 
    146151        if ($remote->format =~ /^RSS / and my $encls = $e->{entry}->{enclosure}) { 
  • branches/hackathon-summary/plagger/lib/Plagger/Plugin/Filter/GuessLanguage.pm

    r1554 r1607  
    121121    my ($self, $context, $args) = @_; 
    122122 
    123     return $args->{entry}->{language} if $args->{entry}->{language};
     123    return $args->{entry}->language if $args->{entry}->language;
    124124 
    125125    $context->log(debug => "start guessing entry's language"); 
  • branches/hackathon-summary/plagger/lib/Plagger/Util.pm

    r1549 r1607  
    2828sub strip_html { 
    2929    my $html = shift; 
     30    utf8::decode($html); 
    3031 
    3132    eval { 
     
    4647    my $formatter = HTML::FormatText->new(leftmargin => 0); 
    4748    my $text = $formatter->format($tree); 
     49#    utf8::decode($text); 
    4850    $text =~ s/\s*$//s; 
    4951    $text; 
  • branches/hackathon-summary/plagger/t/samples/atom10-example.xml

    r1201 r1607  
    11<?xml version="1.0" encoding="utf-8"?> 
    2 <feed xmlns="http://www.w3.org/2005/Atom">
     2<feed xmlns="http://www.w3.org/2005/Atom" xml:lang="en">
    33 
    44  <title>Example Feed</title> 
     
    1818  </entry> 
    1919 
     20  <entry> 
     21    <title>Atom-Powered Robots Run Amok</title> 
     22    <link href="http://example.org/2003/12/13/atom03"/> 
     23    <id>urn:uuid:1225c695-cfb8-4ebb-aaaa-80da344efa6a</id> 
     24    <updated>2003-12-13T18:30:02Z</updated> 
     25    <summary>Some text.</summary> 
     26    <content type="xhtml" xml:lang="ja"> 
     27      <div xmlns="http://www.w3.org/1999/xhtml">foo</div> 
     28    </content> 
     29  </entry> 
     30 
    2031</feed>