hpricot:An Hpricot Showcase:Hpricot Challenge:Strip all HTML tags
まんま
>> require "hpricot"
=> true
>> doc = Hpricot('<p>foo1</p><p>foo2<a href="http://www.foo3.org/">foo3</a></p>')
=> #<Hpricot::Doc {elem <p> "foo1" </p>} {elem <p> "foo2" {elem <a href="http://www.foo3.org/"> "foo3" </a>} </p>}>
>> doc.to_plain_text
=> "foo1\n\nfoo2foo3 [http://www.foo3.org/]"
>> doc.inner_text
=> "foo1foo2foo3"
>> doc = Hpricot('<a href="http://www.math.com" title="1 > 2">1 is > 2')
=> #<Hpricot::Doc {elem <a href="http://www.math.com" title="1 > 2"> "1 is > 2"}>
>> doc.to_plain_text
=> "1 is > 2 [http://www.math.com]"
>> doc.inner_text
=> "1 is > 2"