# scrapy.cfg
# Automatically created by: scrapy startproject
#
# For more information about the [deploy] section see:
# https://scrapyd.readthedocs.io/en/latest/deploy.html

[settings]
# Dotted Python module path of the settings module used by default for
# this project.
default = mspider.settings

[deploy]
# Deploy target URL. It is commented out, so this file sets no URL;
# uncomment and adjust the line below to point at a deploy endpoint.
#url = http://localhost:6800/

# Project name associated with this deploy target.
project = mspider

[custom]
## Project-specific crawl parameters.
## NOTE(review): this section is presumably read by the mspider code, and the
## values look like JSON literals -- confirm against the code that loads them.
##
## N.B.:
## NO trailing comma is allowed, and strings must NOT be delimited with
## single quotes (use double quotes). A single quote INSIDE a double-quoted
## string is used by the xpaths value below.
## e.g.
## start_urls = ["http://image.baidu.com/","http://v.baidu.com/"]
## allowed_domains = ["baidu.com", "bdstatic.com"]
## cookies = {"userid" : "kitt232qsh", "BAIDUID":"3E4101AB69C6EDBDE3A677BC7B8F0794", "BAIDUPSID" : "3E4101AB69C6EDBDE3A677BC7B8F0794"}
## regexes = ["http://image.baidu.com/channel\\S+", "http://image.baidu.com/channel\\S+"]

## List of URLs used as crawl entry points.
start_urls = ["http://image.baidu.com/","http://v.baidu.com/"]
## List of domain names the crawl is limited to.
allowed_domains = ["baidu.com", "bdstatic.com"]
## Cookie name/value pairs.
## NOTE(review): these look like real account/session identifiers stored in
## plain text -- confirm, and consider keeping them out of version control.
cookies = {"userid" : "kitt232qsh", "BAIDUID":"3E4101AB69C6EDBDE3A677BC7B8F0794", "BAIDUPSID" : "3E4101AB69C6EDBDE3A677BC7B8F0794"}
## List of URL patterns; backslashes are written doubled (\\S).
## NOTE(review): both entries are identical -- confirm whether the repetition
## is intentional (e.g. one pattern per start URL) before removing either.
regexes = ["http://image.baidu.com/channel\\S+", "http://image.baidu.com/channel\\S+"]
## List of XPath expressions. The one below selects the src attribute of img
## elements whose src contains 'jpg' and also contains 'hiphotos' or 'bdstatic'.
xpaths = ["//img[contains(@src,'jpg') and (contains(@src,'hiphotos') or contains(@src,'bdstatic'))]/@src"]