fortune_html_parser.py 1.9 KB

1234567891011121314151617181920212223242526272829
  1. # -*- coding: utf-8
  2. from HTMLParser import HTMLParser
  3. class FortuneHTMLParser(HTMLParser):
  4. body = []
  5. valid = '<!DOCTYPE html><html><head><title>Fortunes</title></head><body><table><tr><th>id</th><th>message</th></tr><tr><td>11</td><td>&lt;script&gt;alert("This should not be displayed in a browser alert box.");&lt;/script&gt;</td></tr><tr><td>4</td><td>A bad random number generator: 1, 1, 1, 1, 1, 4.33e+67, 1, 1, 1</td></tr><tr><td>5</td><td>A computer program does what you tell it to do, not what you want it to do.</td></tr><tr><td>2</td><td>A computer scientist is someone who fixes things that aren\'t broken.</td></tr><tr><td>8</td><td>A list is only as strong as its weakest link. — Donald Knuth</td></tr><tr><td>0</td><td>Additional fortune added at request time.</td></tr><tr><td>3</td><td>After enough decimal places, nobody gives a damn.</td></tr><tr><td>7</td><td>Any program that runs right is obsolete.</td></tr><tr><td>10</td><td>Computers make very fast, very accurate mistakes.</td></tr><tr><td>6</td><td>Emacs is a nice operating system, but I prefer UNIX. — Tom Christaensen</td></tr><tr><td>9</td><td>Feature: A bug with seniority.</td></tr><tr><td>1</td><td>fortune: No such file or directory</td></tr><tr><td>12</td><td>フレームワークのベンチマーク</td></tr></table></body></html>'
  6. def handle_decl(self, decl):
  7. self.body.append("<!{d}>".format(d=decl))
  8. def handle_entityref(self, name):
  9. self.body.append("&{n};".format(n=name))
  10. def handle_starttag(self, tag, attrs):
  11. self.body.append("<{t}>".format(t=tag))
  12. def handle_data (self, data):
  13. self.body.append("{d}".format(d=data.strip()))
  14. def handle_endtag(self, tag):
  15. self.body.append("</{t}>".format(t=tag))
  16. def isValidFortune(self):
  17. print "Valid: {v}\n".format(v=self.valid)
  18. print "Input: {i}\n".format(i=''.join(self.body))
  19. print "Equal: {e}\n".format(e=str(self.valid == self.body))
  20. return self.valid == ''.join(self.body)