Scrape more metadata

The script now scrapes category, type, species, and gender as well.
This commit is contained in:
Xerbo 2020-04-09 18:23:32 +01:00
parent 972dacb5bd
commit c6da43bf66

View file

@@ -91,6 +91,10 @@ def download_file(path):
'title': title,
'description': s.find(class_='submission-description').text.strip().replace('\r\n', '\n'),
"tags": [],
'category': s.find(class_='info').find(class_='category-name').text,
'type': s.find(class_='info').find(class_='type-name').text,
'species': s.find(class_='info').findAll('div')[2].find('span').text,
'gender': s.find(class_='info').findAll('div')[3].find('span').text,
'views': int(s.find(class_='views').find(class_='font-large').text),
'favorites': int(s.find(class_='favorites').find(class_='font-large').text),
'rating': s.find(class_='rating-box').text.strip(),
@@ -170,4 +174,4 @@ while True:
page_num += 1
print('Downloading page', page_num)
print('Finished downloading')
print('Finished downloading')