binder.py 9.39 KB
Newer Older
1
# Tweepy
2
3
# Copyright 2009-2010 Joshua Roesslein
# See LICENSE for details.
4

Aaron Hill's avatar
Aaron Hill committed
5
import requests
Josh Roesslein's avatar
Josh Roesslein committed
6
import urllib
7
import time
8
import re
Mike's avatar
Mike committed
9
10
from StringIO import StringIO
import gzip
11

Josh Roesslein's avatar
Josh Roesslein committed
12
from tweepy.error import TweepError
13
from tweepy.utils import convert_to_utf8_str
14
from tweepy.models import Model
15

16
17
# Matches '{name}' placeholders in an endpoint path template.
# Raw string so that \w reaches the regex engine instead of being parsed
# as a (invalid) string escape.
re_path_template = re.compile(r'{\w+}')

Josh Roesslein's avatar
Josh Roesslein committed
18

19
20
21
22
23
24
25
26
27
28
29
def bind_api(**config):

    class APIMethod(object):

        path = config['path']
        payload_type = config.get('payload_type', None)
        payload_list = config.get('payload_list', False)
        allowed_param = config.get('allowed_param', [])
        method = config.get('method', 'GET')
        require_auth = config.get('require_auth', False)
        search_api = config.get('search_api', False)
30
        use_cache = config.get('use_cache', True)
Aaron Hill's avatar
Aaron Hill committed
31
        session = requests.Session()
32
33
34
35
36
37
38
39
40
41
42
43

        def __init__(self, api, args, kargs):
            """Prepare a single call to this endpoint.

            api   -- the API object supplying auth, defaults, roots and hosts.
            args  -- positional request parameters.
            kargs -- keyword arguments. Per-call options (post_data,
                     retry_*, wait_on_rate_limit*, parser, headers) are
                     popped from it; whatever is left is treated as request
                     parameters.

            Raises TweepError when the endpoint requires authentication and
            the API object carries none.
            """
            # Refuse early when credentials are mandatory but missing.
            if self.require_auth and not api.auth:
                raise TweepError('Authentication required!')

            self.api = api
            self.post_data = kargs.pop('post_data', None)

            # Options that fall back to the value configured on the API object.
            for option in ('retry_count', 'retry_delay', 'retry_errors',
                           'wait_on_rate_limit', 'wait_on_rate_limit_notify',
                           'parser'):
                setattr(self, option, kargs.pop(option, getattr(api, option)))

            self.session.headers = kargs.pop('headers', {})

            # Everything still in kargs is a request parameter.
            self.build_parameters(args, kargs)

            # Search endpoints use their own URL root.
            self.api_root = api.search_root if self.search_api else api.api_root

            # Substitute '{name}' placeholders in the path.
            self.build_path()

            self.scheme = 'https://' if api.secure else 'http://'

            # Search endpoints also use their own host.
            self.host = api.search_host if self.search_api else api.host

            # The Host header is set by hand: on python 2.5 or older it would
            # otherwise include the 443 port, which makes Twitter answer with
            # a 301 redirect.
            # See Issue https://github.com/tweepy/tweepy/issues/12
            self.session.headers['Host'] = self.host

            # Rate limit bookkeeping, filled in from response headers.
            self._remaining_calls = None
            self._reset_time = None
78

79
        def build_parameters(self, args, kargs):
            """Collect the request parameters into self.session.params.

            Positional values are matched, by position, against
            allowed_param; keyword values are stored under their own name.
            Values that are None are skipped. Every stored value goes through
            convert_to_utf8_str.

            Raises TweepError when more positional values are given than
            allowed_param has names, or when a keyword repeats a parameter
            that is already set.
            """
            # Bind the new dict to the session up front so it is in place even
            # if an error interrupts the population below.
            query = self.session.params = {}

            for position, value in enumerate(args):
                if value is not None:
                    try:
                        encoded = convert_to_utf8_str(value)
                        query[self.allowed_param[position]] = encoded
                    except IndexError:
                        raise TweepError('Too many parameters supplied!')

            for key, value in kargs.items():
                if value is None:
                    continue
                if key in query:
                    raise TweepError('Multiple values for parameter %s supplied!' % key)
                query[key] = convert_to_utf8_str(value)
96
97
98
99
100

        def build_path(self):
            """Replace every '{name}' placeholder in self.path with a value.

            The value is the URL-quoted request parameter of the same name,
            which is then removed from self.session.params. The one exception
            is '{user}': when no 'user' parameter was given and the API has
            auth, the username reported by the auth handler is used instead.

            Raises TweepError when a placeholder has no matching parameter.
            """
            query = self.session.params

            for placeholder in re_path_template.findall(self.path):
                key = placeholder.strip('{}')
                take_from_auth = (key == 'user' and 'user' not in query
                                  and self.api.auth)

                if take_from_auth:
                    # No 'user' parameter was supplied; ask the auth handler.
                    replacement = self.api.auth.get_username()
                else:
                    try:
                        replacement = urllib.quote(query[key])
                    except KeyError:
                        raise TweepError('No parameter value found for path variable: %s' % key)
                    # The value now lives in the path, not the query string.
                    del query[key]

                self.path = self.path.replace(placeholder, replacement)

113
        def execute(self):
            """Send the request and return the parsed result.

            For cacheable GET requests the API cache is consulted first; on a
            hit the cached value is returned and api.cached_result is set to
            True. Otherwise the request is attempted up to retry_count + 1
            times, sleeping between attempts, and the response body is handed
            to self.parser.parse. The last response is stored on
            api.last_response.

            Raises TweepError when the request cannot be sent or when the
            final response status is outside the 2xx range.
            """
            self.api.cached_result = False

            # Build the request URL
            url = self.api_root + self.path
            full_url = self.scheme + self.host + url

            # Caching only applies to GET requests with a cache configured.
            cache_active = (self.use_cache and self.api.cache
                            and self.method == 'GET')
            if cache_active:
                # The query string must be part of the key; otherwise calls to
                # the same endpoint with different parameters would share one
                # cache entry.
                cache_key = url
                if self.session.params:
                    cache_key = '%s?%s' % (
                        url, urllib.urlencode(self.session.params))

                cache_result = self.api.cache.get(cache_key)
                # if cache result found and not expired, return it
                if cache_result:
                    # must restore api reference
                    if isinstance(cache_result, list):
                        for result in cache_result:
                            if isinstance(result, Model):
                                result._api = self.api
                    elif isinstance(cache_result, Model):
                        cache_result._api = self.api
                    self.api.cached_result = True
                    return cache_result

            # Continue attempting request until successful
            # or maximum number of retries is reached.
            retries_performed = 0
            while retries_performed < self.retry_count + 1:
                # handle running out of api calls
                if (self.wait_on_rate_limit
                        and self._reset_time is not None
                        and self._remaining_calls is not None
                        and self._remaining_calls < 1):
                    sleep_time = self._reset_time - int(time.time())
                    if sleep_time > 0:
                        if self.wait_on_rate_limit_notify:
                            # Single parenthesised argument: prints the same
                            # text whether print is a statement or a function.
                            print("Max retries reached. Sleeping for: " + str(sleep_time))
                        time.sleep(sleep_time + 5)  # sleep for few extra sec

                # Apply authentication. `auth` must be bound even without
                # credentials, otherwise the request call below fails on an
                # undefined local.
                auth = None
                if self.api.auth:
                    auth = self.api.auth.apply_auth()

                # Request compression if configured
                if self.api.compression:
                    self.session.headers['Accept-encoding'] = 'gzip'

                # Execute request
                try:
                    resp = self.session.request(self.method, full_url,
                                                data=self.post_data,
                                                timeout=self.api.timeout,
                                                auth=auth)
                except Exception as e:
                    raise TweepError('Failed to send request: %s' % e)

                # Track the rate limit from the response headers; when the
                # header is absent, count the call against the known budget.
                rem_calls = resp.headers.get('x-rate-limit-remaining')
                if rem_calls is not None:
                    self._remaining_calls = int(rem_calls)
                elif isinstance(self._remaining_calls, int):
                    self._remaining_calls -= 1
                reset_time = resp.headers.get('x-rate-limit-reset')
                if reset_time is not None:
                    self._reset_time = int(reset_time)

                rate_limited = resp.status_code in (429, 420)

                # Ran out of calls: go back to the top of the loop, which
                # waits for the reset, and retry without using up a retry.
                if (self.wait_on_rate_limit and self._remaining_calls == 0
                        and rate_limited):
                    continue

                retry_delay = self.retry_delay
                # Exit request loop if non-retry error code
                if resp.status_code == 200:
                    break
                elif rate_limited and self.wait_on_rate_limit:
                    if 'retry-after' in resp.headers:
                        retry_delay = float(resp.headers['retry-after'])
                elif self.retry_errors and resp.status_code not in self.retry_errors:
                    break

                # Sleep before retrying request again
                time.sleep(retry_delay)
                retries_performed += 1

            # NOTE(review): this rebinds `session` on the instance only; the
            # class-level session used for the request above is untouched.
            # Confirm whether closing that session was the intent.
            self.session = requests.Session()

            # If an error was returned, throw an exception
            self.api.last_response = resp
            if resp.status_code and not 200 <= resp.status_code < 300:
                try:
                    error_msg = self.parser.parse_error(resp.text)
                except Exception:
                    error_msg = "Twitter error response: status code = %s" % resp.status_code
                raise TweepError(error_msg, resp)

            # Parse the response payload. requests has already undone any
            # gzip Content-Encoding, so resp.text is used as is.
            result = self.parser.parse(self, resp.text)

            # Store result into cache if one is available.
            if cache_active and result:
                self.api.cache.store(cache_key, result)

            return result
Josh Roesslein's avatar
Josh Roesslein committed
215

Aaron Hill's avatar
Aaron Hill committed
216
    def _call(api, *args, **kargs):
        """Build an APIMethod for this endpoint and, by default, run it.

        Returns the result of APIMethod.execute(), or the unexecuted
        APIMethod instance itself when a truthy `create` keyword is given.
        """
        bound = APIMethod(api, args, kargs)
        if not kargs.get('create'):
            return bound.execute()
        return bound
Josh Roesslein's avatar
Josh Roesslein committed
223

224
    # Set pagination mode
225
    if 'cursor' in APIMethod.allowed_param:
226
        _call.pagination_mode = 'cursor'
227
228
229
    elif 'max_id' in APIMethod.allowed_param and \
         'since_id' in APIMethod.allowed_param:
        _call.pagination_mode = 'id'
230
    elif 'page' in APIMethod.allowed_param:
231
        _call.pagination_mode = 'page'
232

Josh Roesslein's avatar
Josh Roesslein committed
233
    return _call