使用python获取html页面的内容
import urllib
from HTMLParser import HTMLParser
class TitleParser(HTMLParser):
    """Collect the text of the ``<title>`` element and of ``<div>`` elements.

    Feed HTML with ``feed()``. Afterwards ``title`` holds the text seen
    inside ``<title>`` and ``divcontent`` holds the concatenated text seen
    inside any ``<div>``, including text inside nested divs.
    """

    def __init__(self):
        """Initialise empty accumulators and the underlying HTMLParser."""
        self.title = ''
        self.divcontent = ''
        # Truthy while the parser is inside a <title> element.
        self.readingtitle = 0
        # Number of <div> elements currently open. A counter (rather than
        # a 0/1 flag) keeps capture active until the outermost div closes.
        self.readingdiv = 0
        # Explicit base-class call instead of super(): this also works when
        # HTMLParser is an old-style class.
        HTMLParser.__init__(self)

    def handle_starttag(self, tag, attrs):
        """Start capturing when a ``<title>`` or ``<div>`` tag opens."""
        if tag == 'title':
            self.readingtitle = 1
        elif tag == 'div':
            # Exact match: a substring test would also fire for unrelated
            # tags whose name merely contains "div".
            self.readingdiv += 1

    def handle_data(self, data):
        """Append text to whichever accumulators are currently active."""
        if self.readingtitle:
            # Repeated string concatenation is normally slow, but a title
            # is usually small and simple.
            self.title += data
        if self.readingdiv:
            self.divcontent += data

    def handle_endtag(self, tag):
        """Stop capturing when a ``</title>`` or the outermost ``</div>`` closes."""
        if tag == 'title':
            self.readingtitle = 0
        elif tag == 'div' and self.readingdiv > 0:
            # Guarded so a stray </div> cannot push the depth below zero.
            self.readingdiv -= 1

    def gettitle(self):
        """Return the text collected from ``<title>``."""
        return self.title

    def getdiv(self):
        """Return the text collected from ``<div>`` elements."""
        return self.divcontent
def getweb(url):
    """Download ``url`` and return the raw response body.

    The address is taken from the ``url`` argument, so any page can be
    fetched, and the connection is closed even if reading fails.
    """
    response = urllib.urlopen(url)
    try:
        return response.read()
    finally:
        response.close()
# Fetch the article, extract its title and <div> text, and write both to
# the file 'abinfile' in the current working directory.
web = getweb('http://blog.chinaunix.net/u3/105068/showart_2223566.html')
test = TitleParser()
test.feed(web)
# The with-block closes the file even if one of the writes raises.
with open('abinfile', 'w') as file_object:
    file_object.write(test.title)
    file_object.write("\r\n")
    file_object.write(test.divcontent)
相关文档:
　　1、用表格做流动分割线
　　我们知道,在网页中可以用<hr>标识来做分割线,也可以把表格设置为1个象素高或宽充当分割线。现在,我们将表格与Javascript结合,可以做出更生动的分割线——流动的分割线。加入以下代码,你就可以看到一条分割线,颜色在不断的流动。
<script>
l=Array(6,7,8,9, ......
ʹÓà VAlign ÊôÐÔÖ¸¶¨ÓÉ HtmlTableCell ÀàµÄʵÀýËù±íʾµÄµ¥Ôª¸ñÄÚÈݵĴ¹Ö±¶ÔÆë·½Ê½
“VALIGN"Òâ˼ -- vertical alignment ´¹Ïò¶ÔÆë·½·¨
ÆäÖµ¿ÉÒÔÊÇtop -- ¶¥²¿£»»òmiddle -- Öв¿£»»òbottom-- µ×²¿£»»òbaseline -- »ùÏß¡£Ä¬ÈÏÖв¿--middle¡£
¶ÔÆë£¬¾ÍÊDZí¸ñ£¨Cell)ÄڵĶ«Î÷£¨ÔªËذüÀ¨Í¼ÐΣ©ÅŵÃÕûÆë»®Ò»£¬V ......
大家都知道在table的某一格里插入文本时,如果是中文当然是没有问题,当到达指定宽度时会自动换行,但如果是英文或数字之类的就会有问题了.因为它是以空格为英文单词间的区别,但是如果输入一长串英文,中间不含空格时,表格就变形了.但事实table的style里有一项可以让英文强制换行的,就是word-break,当把这项设为break-all时大家 ......
1£® Ê×ÏȾÍÊÇÔÚ±àÒëÆ÷ÖаÑpython°²×°Ä¿Â¼include/Óëlibs/¼ÓÈ룬¶ÔÓÚÕâµãÎÒÔÚvc6ÖпÉÒÔ£¬µ«ÊÇÔÚdev c++Öм´Ê¹¼ÓÈëÁ˱àÒëÒ²»á³ö´í£¬ËµÕÒ²»µ½pythonÍ·Îļþ£¬Õâµã±È½ÏÓôÃÆ£¬²»¹ý¿¼Âǵ½Ò»°ãwindows±à³Ì¶¼ÓõÄÊÇvc£¬ËùÒÔ²¢Ã»ÓÐʲôӰÏì°É£¡£¡£¡
È»ºóÓÃ#include <Python.h>¾Í¿ÉÒÔ°ÑpythonµÄÖ÷Í·Îļþ°üº¬½øÀ´ÁË¡£
µ«Ê ......