# Short alias for the BeautifulSoup parser class; elsewhere in this listing it
# is called as soup(htcache.fetch(...)) to parse a fetched document.
4 soup = BeautifulSoup.BeautifulSoup
# NOTE(review): the embedded line numbers jump (9 -> 14 -> 18), so parts of this
# class are not visible here; the comments describe only the lines shown.
# Wrapper around the response object returned by urllib.urlopen for one URL.
6 class imgstream(object):
# Opens `url` and keeps the response object as self.bk.
7 def __init__(self, url):
8 self.bk = urllib.urlopen(url)
# Content-Type header value taken from the response's info() mapping.
9 self.ctype = self.bk.info()["Content-Type"]
# read(sz): the visible return forwards `sz` to the wrapped response's read().
# NOTE(review): lines 15-17 are elided; presumably they handle sz being None -- confirm.
14 def read(self, sz = None):
18 return self.bk.read(sz)
# NOTE(review): the enclosing class header is not visible in this listing.
# Presumably this is the `page` class that chapter instantiates as
# page(self, n + 1, url) -- confirm against the full file.
# Stores the owning chapter and derives the volume and manga from it.
21 def __init__(self, chapter, n, url):
22 self.chapter = chapter
23 self.volume = self.chapter.volume
24 self.manga = self.volume.manga
# NOTE(review): lines 25-29 are elided, including the def line that owns the
# statements below.
# Only resolve the image URL when self.ciurl has not been set yet.
30 if self.ciurl is None:
31 page = soup(htcache.fetch(self.url))
# The image URL is the src attribute of <img id="image"> inside <div id="viewer">.
32 self.ciurl = page.find("div", id="viewer").find("img", id="image")["src"]
# Returns an imgstream built from self.iurl() (the owning def line is elided).
36 return imgstream(self.iurl())
# NOTE(review): the embedded numbering has gaps (39 -> 41 -> 46, 47 -> 50 -> 54,
# 58 -> 60, 61 -> 68); several statements and def lines of this class are not
# visible, so the comments describe only the lines shown.
# A chapter belonging to a volume; subclass of lib.pagelist.
38 class chapter(lib.pagelist):
39 def __init__(self, volume, name, url):
# The manga is taken from the owning volume.
41 self.manga = volume.manga
# Indexing delegates to the sequence returned by self.pages().
46 def __getitem__(self, i):
47 return self.pages()[i]
# Number of entries in self.pages() (the owning def line is elided).
50 return len(self.pages())
# Fetch and parse the chapter's first page: self.url with "1.html" appended.
54 pg = soup(htcache.fetch(self.url + "1.html"))
# Locate <div class="l"> inside <form id="top_bar">.
55 l = pg.find("form", id="top_bar").find("div", attrs={"class": "l"})
# Exactly three child nodes are expected; anything else is reported as a parse error.
56 if len(l.contents) != 3:
57 raise Exception("parse error: weird page list for %r" % self)
# Third child node, stripped; the part after its first three characters is
# converted with int() below and used as the page count.
58 m = l.contents[2].strip()
# NOTE(review): the condition guarding this raise (line 59) is elided.
60 raise Exception("parse error: weird page list for %r" % self)
# One page object per page number 1..int(m[3:]), each with URL
# self.url + "<number>.html"; the list is stored in self.cpag.
61 self.cpag = [page(self, n + 1, self.url + ("%i.html" % (n + 1))) for n in xrange(int(m[3:]))]
# Representation string built from the manga, volume and chapter names
# (the owning def line is elided).
68 return "<mangafox.chapter %r.%r.%r>" % (self.manga.name, self.volume.name, self.name)
# NOTE(review): almost all of this class is elided (embedded numbering jumps
# 71 -> 76 -> 86); only the signatures and one return statement are visible.
# A volume of a manga; subclass of lib.pagelist.
70 class volume(lib.pagelist):
71 def __init__(self, manga, name):
# NOTE(review): the body of __getitem__ is not shown.
76 def __getitem__(self, i):
# Representation string built from the manga name and this volume's name
# (the owning def line is elided).
86 return "<mangafox.volume %r.%r>" % (self.manga.name, self.name)
91 if isinstance(el, BeautifulSoup.Tag):
# NOTE(review): the embedded numbering has gaps throughout this class (e.g.
# 95 -> 101, 105 -> 108, 113 -> 115, 118 -> 120, 123 -> 126, 130 -> 137);
# several def lines and assignments (such as `cls` and `name`) are not visible,
# so the comments describe only the lines shown.
# A manga title; subclass of lib.manga.
94 class manga(lib.manga):
95 def __init__(self, lib, name, url):
# Indexing delegates to the sequence returned by self.vols().
101 def __getitem__(self, i):
102 return self.vols()[i]
# Number of entries in self.vols() (the owning def line is elided).
105 return len(self.vols())
# Build the volume list only when self.cvol has not been set yet.
108 if self.cvol is None:
109 page = soup(htcache.fetch(self.url))
# Every <div class="slide"> inside <div id="chapters"> is treated as one volume header.
110 vls = page.find("div", id="chapters").findAll("div", attrs={"class": "slide"})
112 for i in xrange(len(vls)):
# The volume name is the stripped first child of the header's <h3 class="volume">.
113 vol = volume(self, vls[i].find("h3", attrs={"class": "volume"}).contents[0].strip())
# `cls` (assigned on an elided line) must be a <ul> whose class attribute is
# exactly "chlist"; otherwise the page layout is reported as a parse error.
115 if cls.name != u"ul" or cls["class"] != u"chlist":
116 raise Exception("parse error: weird volume list for %r" % self)
117 for ch in cls.findAll("li"):
# The chapter heading is the <h3> inside the item's <div>, or the <h4> if that lookup is falsy.
118 n = ch.div.h3 or ch.div.h4
120 for span in ch("span"):
# Space-padding both sides checks that "title" is one of the whitespace-separated
# class names rather than a substring of another class name.
122 if u" title " in (u" " + span["class"] + u" "):
123 name += " " + span.string
126 url = n.a["href"].encode("us-ascii")
# Chapter links are expected to end in "/1.html".
127 if url[-7:] != "/1.html":
128 raise Exception("parse error: unexpected chapter URL for %r: %s" % (self, url))
# url[:-6] drops "1.html" but keeps the trailing slash. Each chapter is inserted
# at index 0, so vol.ch ends up in reverse of the iteration order.
129 vol.ch.insert(0, chapter(vol, name, url[:-6]))
# Volumes are likewise inserted at index 0 of self.cvol.
130 self.cvol.insert(0, vol)
# Representation string built from the manga name (the owning def line is elided).
137 return "<mangafox.manga %r>" % self.name
def libalphacmp(a, b):
    """Compare two strings case-insensitively, cmp()-style.

    Both arguments are upper-cased before being compared.

    Returns -1, 0 or 1 when ``a`` sorts before, equal to, or after ``b``.
    """
    upper_a, upper_b = a.upper(), b.upper()
    # (x > y) - (x < y) yields the same -1/0/1 as the cmp() builtin, which
    # no longer exists in Python 3, so this form works on both versions.
    return (upper_a > upper_b) - (upper_a < upper_b)
# NOTE(review): the embedded numbering has gaps throughout this class (e.g.
# 142 -> 144, 148 -> 151, 166 -> 170, 174 -> 182 -> 188 -> 193 -> 197); the
# __init__ header, loop headers and all branch bodies of byname are not visible,
# so the comments describe only the lines shown.
# Entry point for the site; subclass of lib.library.
142 class library(lib.library):
# Base URL that the directory paths below are appended to.
144 self.base = "http://www.mangafox.com/"
# alphapage(pno): fetches directory page number `pno` ("directory/<pno>.htm?az")
# and appends one manga object per parsed entry to `ret`.
146 def alphapage(self, pno):
147 page = soup(htcache.fetch(self.base + ("directory/%i.htm?az" % pno)))
# All <li> items of <ul class="list"> inside <div id="mangalist">.
148 ls = page.find("div", id="mangalist").find("ul", attrs={"class": "list"}).findAll("li")
# For an item `m` (the loop header is elided): the <a class="title"> link inside
# its <div class="manga_text">.
151 t = m.find("div", attrs={"class": "manga_text"}).find("a", attrs={"class": "title"})
153 url = t["href"].encode("us-ascii")
154 ret.append(manga(self, name, url))
# alphapages(): fetches "directory/?az" and returns, as an int, the text of the
# link in the second-to-last <li> of the navigation list.
# NOTE(review): presumably that item holds the highest page number -- confirm.
157 def alphapages(self):
158 page = soup(htcache.fetch(self.base + "directory/?az"))
159 ls = page.find("div", id="mangalist").find("div", id="nav").find("ul").findAll("li")
160 return int(ls[-2].find("a").string)
# byname(prefix): case-insensitive lookup by name prefix.
# NOTE(review): the visible lines look like a binary search over directory
# pages followed by a scan; the branch bodies are elided -- confirm.
162 def byname(self, prefix):
# Byte strings are decoded as UTF-8 so comparisons are done on unicode.
163 if not isinstance(prefix, unicode):
164 prefix = prefix.decode("utf8")
166 r = self.alphapages()
# Midpoint between l and r, rounded up.
170 c = l + ((r + 1 - l) // 2)
171 ls = self.alphapage(c)
# First entry on page c sorts after the prefix.
172 if libalphacmp(ls[0].name, prefix) > 0:
# Last entry on page c sorts before the prefix.
174 elif libalphacmp(ls[-1].name, prefix) < 0:
# Entry `m` sorts at or after the prefix.
182 if libalphacmp(m.name, prefix) >= 0:
# Entry name does not start with the prefix, ignoring case.
188 if not m.name[:len(prefix)].upper() == prefix.upper():
193 ls = self.alphapage(pno)
# Raised by a method whose def line is elided.
197 raise NotImplementedError("mangafox iterator")