前言
最近在搞自動購買的東西,然後就扯到json了,
後來發現我沒有對json做一個懶人程式碼包。
def start_requests(self):
    """Yield one search request per entry found in the ``wishList`` collection.

    Each document's ``name`` is logged, URL-quoted and appended to the base
    search URL; its ``quote`` value is passed along to ``parse`` through the
    request meta under the ``favorite`` key.
    """
    source_url = "...."
    projection = {"name": 1, "_id": 0, "quote": 1}
    for wish in self.db.wishList.find({}, projection):
        title = wish['name']
        self.log(title)
        start_url = source_url + urlparse.quote(title)
        yield scrapy.Request(
            start_url,
            callback=self.parse,
            meta={"favorite": wish['quote']},
        )
def parse(self, response):
    """Log the ``favorite`` value carried in the response's request meta.

    Args:
        response: the response handed to this callback; its ``meta``
            mapping is read for the ``favorite`` key.
    """
    # le = LinkExtractor(restrict_css='div.panel-default>a.list-group-item')
    # Points at the second-hand book list.
    # self.log("source_url_link is ===" + response.url)
    # Format the value instead of concatenating it: ``favorite`` may be
    # absent (None) or a non-string value, and ``str + None`` / ``str + int``
    # raises TypeError.
    self.log("favorite: {}".format(response.meta.get('favorite')))
sudo vim /usr/bin/pip3  # 將檔案中下方第一段(from pip import main)改成第二段(from pip import __main__)
from pip import main
if __name__ == '__main__':
sys.exit(main())
from pip import __main__
if __name__ == '__main__':
sys.exit(__main__._main())
建立環境
conda create -n envName
conda create -n envName python=3
進入環境
source activate envName #在base底下要切換的話用這組
conda activate envName #通常用這組可以通吃
安裝套件
conda install packageName
套件列表
conda list
離開環境
conda deactivate
#ubuntu只顯示資料夾
ls -d */
pip3 search <package> 搜尋套件
pip3 install <package> 安裝套件
pip3 uninstall <package> 移除套件
pip3 list 套件列表
pip3 list --outdated 檢查有無升級
pip3 install -U|--upgrade <package> 軟體更新包
pip3 --version pip3 版本資訊
sudo pip3 install --upgrade pip 升級pip自己
將目前的套件存成文字檔後匯入
pip3 freeze > aa.txt
pip3 install -r aa.txt
scrapy startproject scrapy_spider
import scrapy
class booksSpider(scrapy.Spider):
    """Spider named ``books`` that saves a books.com.tw product page to disk."""

    name = "books"
    allowed_domains = ["books.com.tw"]
    start_urls = [
        "http://www.books.com.tw/products/0010789024",
    ]

    def parse(self, response):
        """Write the raw response body to a file named after the URL's last path segment.

        Args:
            response: the fetched page; ``response.url`` determines the file
                name and ``response.body`` (bytes) is written unchanged.
        """
        # Strip any trailing slash before splitting so URLs with and without
        # one both yield the final segment (e.g. "0010789024"). Indexing [-2]
        # on a slash-less URL returned the parent segment ("products"), which
        # would make every product page overwrite the same file.
        filename = response.url.rstrip("/").split("/")[-1]
        with open(filename, 'wb') as f:
            f.write(response.body)
scrapy crawl books
如果出現 no active project,Unknown command: crawl,Use "scrapy" to see available commands,代表目前不在 Scrapy 專案目錄內,請先 cd 到含有 scrapy.cfg 的專案資料夾(例如 scrapy_spider)再執行。
scrapy crawl books -o aa.csv
conda create -n envName
activate envName
conda env remove -n envName
conda env list
conda install packageName
conda list
conda remove packageName
deactivate