fortune_html_parser.py 1.6 KB

1234567891011121314151617181920212223
  1. # -*- coding: utf-8
  2. from HTMLParser import HTMLParser
  3. class FortuneHTMLParser(HTMLParser):
  4. body = []
  5. valid = '<!DOCTYPE html><html><head><title>Fortunes</title></head><body><table><tr><th>id</th><th>message</th></tr><tr><td>11</td><td>&lt;script&gt;alert("This should not be displayed in a browser alert box.");&lt;/script&gt;</td></tr><tr><td>4</td><td>A bad random number generator: 1, 1, 1, 1, 1, 4.33e+67, 1, 1, 1</td></tr><tr><td>5</td><td>A computer program does what you tell it to do, not what you want it to do.</td></tr><tr><td>2</td><td>A computer scientist is someone who fixes things that aren\'t broken.</td></tr><tr><td>8</td><td>A list is only as strong as its weakest link. — Donald Knuth</td></tr><tr><td>0</td><td>Additional fortune added at request time.</td></tr><tr><td>3</td><td>After enough decimal places, nobody gives a damn.</td></tr><tr><td>7</td><td>Any program that runs right is obsolete.</td></tr><tr><td>10</td><td>Computers make very fast, very accurate mistakes.</td></tr><tr><td>6</td><td>Emacs is a nice operating system, but I prefer UNIX. — Tom Christaensen</td></tr><tr><td>9</td><td>Feature: A bug with seniority.</td></tr><tr><td>1</td><td>fortune: No such file or directory</td></tr><tr><td>12</td><td>フレームワークのベンチマーク</td></tr></table></body></html>'
  6. def handle_decl(self, decl, args):
  7. print "decl: '{d}'".format(d=decl)
  8. def handle_starttag(self, tag, attrs):
  9. print "start tag: '{s}'".format(s=tag)
  10. def handle_data (self, data):
  11. print "data: '{s}'".format(s=data)
  12. def handle_endtag(self, tag):
  13. print "end tag: '{s}'".format(s=tag)
  14. def isValidFortune(self):
  15. return True