pipenv shell
cd appstore_crawler
export LANG=en_US.utf8 # to avoid ParserError
run one category
# set category
CATEGORY=photo-video
# this example will crawl urls includes /genre/ios-{category}# i.e. https://apps.apple.com/us/genre/ios-photo-video/id6008
scrapy crawl appstore \
-a category=${CATEGORY} \
-s JOBDIR=crawls/${CATEGORY}-1 # update this number or delete the dir
fromPILimportImageimportnumpyasnpicon=Image.open('appstore_crawler/icondata/photo-video/1006639052.png')
img=np.array(icon, 'f')
print(img.dtype) # dtype('float32')print(img.shape) # (246, 246, 3)# NOTE: the order is RGB (c.f. OpenCV is BGR)
# for example Evernote
scrapy shell https://apps.apple.com/us/app/evernote/id281796108
# another example Dropbox
scrapy shell https://apps.apple.com/us/app/dropbox/id327630330
(reference) command log of initial setup
export PIPENV_VENV_IN_PROJECT=true
pipenv --python 3.6
pipenv install scrapy tqdm python-dateutil pandas
pipenv run pip list
pipenv graph