%PDF- %PDF-
Direktori : /lib/calibre/calibre/gui2/store/stores/ |
Current File : //lib/calibre/calibre/gui2/store/stores/empik_plugin.py |
# -*- coding: utf-8 -*- from __future__ import absolute_import, division, print_function, unicode_literals store_version = 9 # Needed for dynamic plugin loading __license__ = 'GPL 3' __copyright__ = '2011-2019, Tomasz Długosz <tomek3d@gmail.com>' __docformat__ = 'restructuredtext en' from base64 import b64encode from contextlib import closing try: from urllib.parse import quote except ImportError: from urllib import quote from lxml import html from qt.core import QUrl from calibre import browser, url_slash_cleaner from calibre.gui2 import open_url from calibre.gui2.store import StorePlugin from calibre.gui2.store.basic_config import BasicStoreConfig from calibre.gui2.store.search_result import SearchResult from calibre.gui2.store.web_store_dialog import WebStoreDialog def as_base64(data): if not isinstance(data, bytes): data = data.encode('utf-8') ans = b64encode(data) if isinstance(ans, bytes): ans = ans.decode('ascii') return ans class EmpikStore(BasicStoreConfig, StorePlugin): def open(self, parent=None, detail_item=None, external=False): aff_root = 'https://www.a4b-tracking.com/pl/stat-click-text-link/78/58/' url = 'https://www.empik.com/ebooki' aff_url = aff_root + as_base64(url) detail_url = None if detail_item: detail_url = aff_root + as_base64(detail_item) if external or self.config.get('open_external', False): open_url(QUrl(url_slash_cleaner(detail_url if detail_url else aff_url))) else: d = WebStoreDialog(self.gui, url, parent, detail_url if detail_url else aff_url) d.setWindowTitle(self.name) d.set_tags(self.config.get('tags', '')) d.exec() def search(self, query, max_results=10, timeout=60): url = 'https://www.empik.com/ebooki/ebooki,3501,s?sort=scoreDesc&resultsPP={}&q={}'.format(max_results, quote(query)) br = browser() counter = max_results with closing(br.open(url, timeout=timeout)) as f: doc = html.fromstring(f.read()) for data in doc.xpath('//div[@class="search-content js-search-content"]/div'): if counter <= 0: break id = ''.join(data.xpath('.//div[@class="name"]/a/@href')) if not id: continue cover_url = ''.join(data.xpath('.//a/img[@class="lazy"]/@lazy-img')) author = ', '.join(data.xpath('.//a[@class="smartAuthor"]/text()')) title = ''.join(data.xpath('.//div[@class="name"]/a/@title')) price = ''.join(data.xpath('.//div[@class="price ta-price-tile "]/text()')) # with closing(br.open('https://empik.com' + id.strip(), timeout=timeout/4)) as nf: # idata = html.fromstring(nf.read()) # crawled = idata.xpath('.//a[(@class="chosen hrefstyle") or (@class="connectionsLink hrefstyle")]/text()') # formats = ','.join([re.sub('ebook, ','', x.strip()) for x in crawled if 'ebook' in x]) counter -= 1 s = SearchResult() s.cover_url = cover_url s.title = title.split(' - ')[0] s.author = author.strip() s.price = price.strip() s.detail_item = 'https://empik.com' + id.strip() # s.formats = formats.upper().strip() yield s