hpricot:An Hpricot Showcase:Hpricot Challenge:Strip all HTML tags

原文(Hpricot Challenge の「Strip all HTML tags」)のサンプルそのままです。

>> require "hpricot"
=> true
>> doc = Hpricot('<p>foo1</p><p>foo2<a href="http://www.foo3.org/">foo3</a></p>')
=> #<Hpricot::Doc {elem <p> "foo1" </p>} {elem <p> "foo2" {elem <a href="http://www.foo3.org/"> "foo3" </a>} </p>}>
>> doc.to_plain_text
=> "foo1\n\nfoo2foo3 [http://www.foo3.org/]"
>> doc.inner_text
=> "foo1foo2foo3"
>> doc = Hpricot('<a href="http://www.math.com" title="1 > 2">1 is > 2')
=> #<Hpricot::Doc {elem <a href="http://www.math.com" title="1 > 2"> "1 is > 2"}>
>> doc.to_plain_text
=> "1 is > 2 [http://www.math.com]"
>> doc.inner_text
=> "1 is > 2"