[2/n] click-ify - add 2_dump_detail command
Run with: `poetry run python main.py --step dump_detail`
This commit is contained in:
parent
90b531f5d9
commit
c2196c15c1
2 changed files with 31 additions and 21 deletions
|
|
@ -4,28 +4,36 @@ from tqdm import tqdm
|
||||||
|
|
||||||
from data_access import Listing
|
from data_access import Listing
|
||||||
|
|
||||||
incremental = True
|
|
||||||
|
def dump_detail():
|
||||||
|
incremental = True
|
||||||
|
listings = Listing.get_all_listings()
|
||||||
|
filtered_listings = []
|
||||||
|
for listing in listings:
|
||||||
|
# We introduced last_seen later, so not all entries have it.
|
||||||
|
# If it doesn't exist, then it's not on the platform anymore, so skip it.
|
||||||
|
last_seen = listing.last_seen
|
||||||
|
if last_seen is None:
|
||||||
|
continue
|
||||||
|
|
||||||
|
if not incremental and last_seen <= 1:
|
||||||
|
filtered_listings.append(listing)
|
||||||
|
|
||||||
|
if incremental and not listing.path_detail_json().exists():
|
||||||
|
filtered_listings.append(listing)
|
||||||
|
|
||||||
|
for listing in tqdm(filtered_listings):
|
||||||
|
try:
|
||||||
|
d = detail_query(listing.identifier)
|
||||||
|
with open(listing.path_detail_json(), "w") as f:
|
||||||
|
json.dump(d, f)
|
||||||
|
except Exception as e:
|
||||||
|
print(e)
|
||||||
|
|
||||||
|
|
||||||
listings = Listing.get_all_listings()
|
def main():
|
||||||
filtered_listings = []
|
dump_detail()
|
||||||
for listing in listings:
|
|
||||||
# We introduced last_seen later, so not all entries have it.
|
|
||||||
# If it doesn't exist, then it's not on the platform anymore, so skip it.
|
|
||||||
last_seen = listing.last_seen
|
|
||||||
if last_seen is None:
|
|
||||||
continue
|
|
||||||
|
|
||||||
if not incremental and last_seen <= 1:
|
|
||||||
filtered_listings.append(listing)
|
|
||||||
|
|
||||||
if incremental and not listing.path_detail_json().exists():
|
if __name__ == "__main__":
|
||||||
filtered_listings.append(listing)
|
main()
|
||||||
|
|
||||||
for listing in tqdm(filtered_listings):
|
|
||||||
try:
|
|
||||||
d = detail_query(listing.identifier)
|
|
||||||
with open(listing.path_detail_json(), "w") as f:
|
|
||||||
json.dump(d, f)
|
|
||||||
except Exception as e:
|
|
||||||
print(e)
|
|
||||||
|
|
|
||||||
|
|
@ -2,9 +2,11 @@ import click
|
||||||
import importlib
|
import importlib
|
||||||
|
|
||||||
dump_listings_module = importlib.import_module('1_dump_listings')
|
dump_listings_module = importlib.import_module('1_dump_listings')
|
||||||
|
dump_detail_module = importlib.import_module('2_dump_detail')
|
||||||
|
|
||||||
steps_to_handlers = {
|
steps_to_handlers = {
|
||||||
'dump_listings': dump_listings_module.dump_listings,
|
'dump_listings': dump_listings_module.dump_listings,
|
||||||
|
'dump_detail': dump_detail_module.dump_detail,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue