diff options
Diffstat (limited to 'to_csv.py')
-rw-r--r-- | to_csv.py | 30 |
1 files changed, 30 insertions, 0 deletions
"""Export cases obtained from ``MGSPiracy`` to a CSV file.

Usage: ``python to_csv.py [--output FILE] [--from N] [--to N]``
"""
import csv
from argparse import ArgumentParser

from mgs import MGSPiracy

# Keys read from every case, in the order they are written as CSV columns.
CASE_FIELDS = (
    'date',
    'statement_number',
    'applicant',
    'object',
    'doc_link',
    'violation_links',
)


def parse_args(argv=None):
    """Parse the command-line options of the script.

    Args:
        argv: Argument list to parse. ``None`` lets argparse read
            ``sys.argv[1:]``.

    Returns:
        Namespace with ``output`` (str, default ``'output.csv'``),
        ``_from`` (int, default 0) and ``to`` (int, default 10).
    """
    argp = ArgumentParser()
    argp.add_argument('--output', type=str, default='output.csv', help='CSV output file name')
    # ``from`` is a Python keyword, so the value is stored under ``_from``.
    argp.add_argument('--from', type=int, default=0, help='First page', dest='_from')
    argp.add_argument('--to', type=int, default=10, help='Last page')
    return argp.parse_args(argv)


def write_cases(cases, path):
    """Write one CSV row per case to ``path``, overwriting any existing file.

    Args:
        cases: Iterable of mappings; each must provide every key listed in
            ``CASE_FIELDS``.
        path: Name of the CSV file to create.

    Raises:
        KeyError: If a case lacks one of the ``CASE_FIELDS`` keys.
        OSError: If the file cannot be opened or written.
    """
    # ``newline=''`` is what the csv module requires of files it writes to.
    # The explicit encoding keeps the output independent of the platform
    # locale. ``with`` guarantees the file is closed even when a row fails.
    with open(path, 'w', newline='', encoding='utf-8') as f:
        csv.writer(f).writerows(
            [case[field] for field in CASE_FIELDS] for case in cases
        )


def main():
    """Fetch the cases for the requested pages and dump them to CSV."""
    args = parse_args()

    # The page bounds are handed to MGSPiracy unchanged.
    # NOTE(review): whether ``to_page`` is inclusive is decided by MGSPiracy.
    mgs = MGSPiracy(from_page=args._from, to_page=args.to)

    # Fetch before opening the output so that a failed fetch does not
    # truncate an existing file.
    cases = mgs.get_cases()

    write_cases(cases, args.output)


if __name__ == '__main__':
    main()