-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathspreadsheet.py
156 lines (135 loc) · 5.03 KB
/
spreadsheet.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
#!/usr/bin/env python
# Class for common Google sheet operations.
import os
import sys
import json
import doctest
import csv
import gspread
import string
from oauth2client.client import SignedJwtAssertionCredentials
from collections import defaultdict
try:
from collections import OrderedDict
except ImportError:
# python 2.6 or earlier, use backport
from ordereddict import OrderedDict
import argparse
class Sheet:
""" Handle google spreadsheet read and flatfile write operations.
>>> sheet = Sheet('test-sheet', 'worksheet-name')
>>> sheet.publish()
True
"""
def __init__(self, sheet_name, worksheet=None):
self.options = None
self.directory = os.path.dirname(os.path.realpath(__file__))
if not os.path.isdir('%s/output' % self.directory):
os.mkdir('%s/output' % self.directory)
scope = ['https://spreadsheets.google.com/feeds']
self.credentials = SignedJwtAssertionCredentials(
os.environ.get('ACCOUNT_USER'),
string.replace(os.environ.get('ACCOUNT_KEY'), "\\n", "\n"),
scope)
self.spread = gspread.authorize(self.credentials)
self.sheet_name = sheet_name
self.filters = None
if worksheet:
self.open_worksheet(worksheet)
self.worksheet = worksheet
def set_options(self, options):
""" Set the objects options var.
"""
self.options = options
return options
def slugify(self, slug):
return slug.lower().replace(' ', '-')
def add_filter(self, key, value):
""" Add a filter we will parse the spreadsheet by. Key should match
a key in the spreadsheet (capitalization matters).
>>> sheet = Sheet('test-sheet', 'worksheet-name')
>>> sheet.add_filter('name', 'test')
True
>>> sheet.filters
[{'value': 'test', 'key': 'name'}]
"""
if self.filters:
self.filters.append({'key': key, 'value': value})
else:
self.filters = [{'key': key, 'value': value}]
return True
def build_filename(self):
""" Put together the name of the file we're writing. This is based
on the worksheet name and any filters.
>>> sheet = Sheet('test-sheet', 'worksheet-name')
>>> sheet.add_filter('name', 'test')
True
>>> sheet.build_filename()
True
>>> sheet.filename
'worksheet-name-test'
"""
filter_string = ''
if self.filters:
filter_string += '-'
for item in self.filters:
filter_string += self.slugify(item['value'])
self.filename = '%s%s' % (self.worksheet, filter_string)
return True
def open_worksheet(self, worksheet):
""" Open a spreadsheet, return a sheet object.
>>> sheet = Sheet('test-sheet')
>>> sheet.open_worksheet('worksheet-name')
<Worksheet 'worksheet-name' id:od6>
"""
self.sheet = self.spread.open(self.sheet_name).worksheet(worksheet)
return self.sheet
def publish(self, worksheet=None):
""" Publish the data in whatever permutations we need.
This assumes the spreadsheet's key names are in the first row.
>>> sheet = Sheet('test-sheet', 'worksheet-name')
>>> sheet.publish()
True
"""
if not self.sheet or worksheet:
self.sheet = self.open_worksheet(worksheet)
if not worksheet:
worksheet = self.worksheet
self.build_filename()
rows = self.sheet.get_all_values()
keys = rows[0]
fn = {
'json': open('%s/output/%s.json' % (self.directory, self.filename), 'wb'),
'csv': open('%s/output/%s.csv' % (self.directory, self.filename), 'wb')
}
recordwriter = csv.writer(
fn['csv'], delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
records = []
for i, row in enumerate(rows):
if i == 0:
keys = row
recordwriter.writerow(keys)
continue
record = OrderedDict(zip(keys, row))
recordwriter.writerow(row)
records += [record]
if records:
json.dump(records, fn['json'])
return True
def main(args):
""" Take args as key=value pairs, pass them to the add_filter method.
Example command:
$ python spreadsheet.py City=Denver
"""
sheet = Sheet('Sports', 'broncos-sacks-2015')
sheet.set_options(args)
sheet.publish()
if __name__ == '__main__':
parser = argparse.ArgumentParser(usage='$ python spreadsheet.py',
description='',
epilog='')
parser.add_argument("-v", "--verbose", dest="verbose", default=False, action="store_true")
args = parser.parse_args()
if args.verbose:
doctest.testmod(verbose=args.verbose)
main(args)