-
Notifications
You must be signed in to change notification settings - Fork 2
/
javbus.py
65 lines (47 loc) · 1.29 KB
/
javbus.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# -*- coding: utf-8 -*-
import ConfigParser
import requests
from bs4 import BeautifulSoup
class JavbusConfig(object):
    """Settings for the Javbus site that the crawler targets."""

    # Default root URL of the site; assign ``url`` on an instance to
    # override it without touching this class-level default.
    url = 'https://www.javbus.com'
class ProxyConfig(object):
    """Proxy settings carried alongside the crawler configuration.

    Every field is a class-level default; assign the attribute on an
    instance to override it for that instance only.
    """

    # The proxy is switched off by default.
    enabled = False
    host = '127.0.0.1'
    # The port is stored as a string, not as an int.
    port = '1080'
    protocol = 'socks5'
    # Both credentials default to the empty string.
    username = ''
    password = ''
class CrawlerConfig(object):
    """Container bundling the site settings and the proxy settings."""

    # Filled in with a JavbusConfig by loadConfig(); JavbusCrawler reads
    # ``javbus.url`` from it.
    javbus = None
    # Filled in with a ProxyConfig by loadConfig().
    proxy = None
class JavbusCrawler(object):
    """Crawler for the site rooted at ``baseUrl``.

    Only ``crawlTags`` performs any work so far; the actress crawlers are
    placeholders that return None.
    """

    # Class-level fallback; __init__ replaces it with the configured URL.
    baseUrl = 'https://www.javbus.com'

    def __init__(self, conf):
        """Remember the site root URL found at ``conf.javbus.url``.

        ``conf`` may be any object exposing a ``javbus`` attribute that in
        turn has a ``url`` attribute (for example a CrawlerConfig).
        """
        self.baseUrl = conf.javbus.url

    def crawlActress(self):
        """Placeholder: not implemented yet; returns None."""
        return

    def crawlActresses(self, page):
        """Placeholder: not implemented yet; ``page`` is ignored.

        Returns None.
        """
        return

    def crawlTags(self):
        """Download and parse the ``/genre`` page of the configured site.

        The page is fetched with ``requests`` and parsed with BeautifulSoup
        using the ``html5lib`` parser. Extraction of the genre entries has
        not been written yet, so the method currently returns None.
        """
        # Must go through ``self``: names bound in the class body are not
        # visible as bare names inside a method, so a plain ``baseUrl``
        # raises NameError here.
        url = self.baseUrl + '/genre'
        resp = requests.get(url)
        doc = BeautifulSoup(resp.text, 'html5lib')
        # TODO: pull the genre entries out of ``doc``. The original
        # statement here (``genreBoxes = doc.``) was left unfinished and did
        # not parse, so the intended lookup is unknown.
        return
def loadConfig():
    """Build and return the crawler configuration.

    The values are hard-coded for now: the site URL is set to
    'https://www.busdmm.one' and the proxy is disabled.

    Returns:
        A CrawlerConfig whose ``javbus`` is a JavbusConfig and whose
        ``proxy`` is a ProxyConfig.
    """
    # TODO: read these settings from 'crawler.ini' with ConfigParser
    # (section 'javbus': url; section 'proxy': host, port) instead of
    # hard-coding them.
    site = JavbusConfig()
    site.url = 'https://www.busdmm.one'

    tunnel = ProxyConfig()
    tunnel.enabled = False

    settings = CrawlerConfig()
    settings.javbus = site
    settings.proxy = tunnel
    return settings
# Script entry point: when the file is executed directly, build the
# configuration. Nothing is done with it yet.
if __name__ == '__main__':
    conf = loadConfig()