1 | /* |
---|
2 | * This file Copyright (C) 2008-2010 Mnemosyne LLC |
---|
3 | * |
---|
4 | * This file is licensed by the GPL version 2. Works owned by the |
---|
5 | * Transmission project are granted a special exemption to clause 2(b) |
---|
6 | * so that the bulk of its code can remain under the MIT license. |
---|
7 | * This exemption does not extend to derived works not owned by |
---|
8 | * the Transmission project. |
---|
9 | * |
---|
10 | * $Id: web.c 10232 2010-02-19 17:08:13Z charles $ |
---|
11 | */ |
---|
12 | |
---|
13 | #include <assert.h> |
---|
14 | |
---|
15 | #include <curl/curl.h> |
---|
16 | #include <event.h> |
---|
17 | #include <evdns.h> |
---|
18 | |
---|
19 | #include "transmission.h" |
---|
20 | #include "net.h" |
---|
21 | #include "ptrarray.h" |
---|
22 | #include "session.h" |
---|
23 | #include "trevent.h" |
---|
24 | #include "utils.h" |
---|
25 | #include "version.h" |
---|
26 | #include "web.h" |
---|
27 | |
---|
/* Constants shared by the whole file. */
enum
{
    /* byte value written over a struct right before it is freed */
    TR_MEMORY_TRASH = 0xCC,

    /* timer interval used when libcurl does not ask for a positive one */
    DEFAULT_TIMER_MSEC = 250, /* arbitrary */

    /* smallest lifetime given to a DNS cache entry (one day, presumably in
     * seconds since it is added to tr_time()) */
    MIN_DNS_CACHE_TIME = 24 * 60 * 60
};
---|
36 | |
---|
/* Debug logging helper.
 * With "#if 0" the messages are routed to the deep log, and only when deep
 * logging is active.  Change it to "#if 1" to print every message straight
 * to stderr instead. */
#if 0
#define dbgmsg(...) \
    do { \
        fprintf( stderr, __VA_ARGS__ ); \
        fprintf( stderr, "\n" ); \
    } while( 0 )
#else
#define dbgmsg( ... ) \
    do { \
        if( tr_deepLoggingIsActive( ) ) \
            tr_deepLog( __FILE__, __LINE__, "web", __VA_ARGS__ ); \
    } while( 0 )
#endif
---|
50 | |
---|
51 | /*** |
---|
52 | **** |
---|
53 | ***/ |
---|
54 | |
---|
55 | struct tr_web |
---|
56 | { |
---|
57 | tr_bool closing; |
---|
58 | tr_bool haveAddr; |
---|
59 | int taskCount; |
---|
60 | long timer_msec; |
---|
61 | CURLM * multi; |
---|
62 | tr_session * session; |
---|
63 | tr_address addr; |
---|
64 | tr_ptrArray dns_cache; |
---|
65 | struct event timer_event; |
---|
66 | }; |
---|
67 | |
---|
68 | struct dns_cache_item; |
---|
69 | static void dns_cache_item_free( struct dns_cache_item * ); |
---|
70 | |
---|
71 | static void |
---|
72 | web_free( tr_web * g ) |
---|
73 | { |
---|
74 | evdns_shutdown( TRUE ); |
---|
75 | curl_multi_cleanup( g->multi ); |
---|
76 | evtimer_del( &g->timer_event ); |
---|
77 | tr_ptrArrayDestruct( &g->dns_cache, (PtrArrayForeachFunc)dns_cache_item_free ); |
---|
78 | memset( g, TR_MEMORY_TRASH, sizeof( struct tr_web ) ); |
---|
79 | tr_free( g ); |
---|
80 | } |
---|
81 | |
---|
82 | /*** |
---|
83 | **** |
---|
84 | ***/ |
---|
85 | |
---|
86 | struct tr_web_task |
---|
87 | { |
---|
88 | int port; |
---|
89 | unsigned long tag; |
---|
90 | struct curl_slist * slist; |
---|
91 | struct evbuffer * response; |
---|
92 | char * url; |
---|
93 | char * resolved_url; |
---|
94 | char * host; |
---|
95 | const char * resolved_host; |
---|
96 | char * range; |
---|
97 | tr_session * session; |
---|
98 | tr_web_done_func * done_func; |
---|
99 | void * done_func_user_data; |
---|
100 | struct event timer_event; |
---|
101 | CURL * easy; |
---|
102 | CURLM * multi; |
---|
103 | tr_bool timer_event_isSet; |
---|
104 | }; |
---|
105 | |
---|
106 | static void |
---|
107 | task_free( struct tr_web_task * task ) |
---|
108 | { |
---|
109 | if( task->slist != NULL ) |
---|
110 | curl_slist_free_all( task->slist ); |
---|
111 | if( task->timer_event_isSet ) |
---|
112 | evtimer_del( &task->timer_event ); |
---|
113 | evbuffer_free( task->response ); |
---|
114 | tr_free( task->host ); |
---|
115 | tr_free( task->range ); |
---|
116 | tr_free( task->resolved_url ); |
---|
117 | tr_free( task->url ); |
---|
118 | memset( task, TR_MEMORY_TRASH, sizeof( struct tr_web_task ) ); |
---|
119 | tr_free( task ); |
---|
120 | } |
---|
121 | |
---|
122 | /*** |
---|
123 | **** |
---|
124 | ***/ |
---|
125 | |
---|
126 | struct dns_cache_item |
---|
127 | { |
---|
128 | char * host; |
---|
129 | char * resolved_host; |
---|
130 | time_t expiration; |
---|
131 | tr_bool success; |
---|
132 | }; |
---|
133 | |
---|
134 | static void |
---|
135 | dns_cache_item_free( struct dns_cache_item * item ) |
---|
136 | { |
---|
137 | if( item != NULL ) |
---|
138 | { |
---|
139 | tr_free( item->host ); |
---|
140 | tr_free( item->resolved_host ); |
---|
141 | memset( item, TR_MEMORY_TRASH, sizeof( struct dns_cache_item ) ); |
---|
142 | tr_free( item ); |
---|
143 | } |
---|
144 | } |
---|
145 | |
---|
146 | static int |
---|
147 | dns_cache_compare( const void * va, const void * vb ) |
---|
148 | { |
---|
149 | const struct dns_cache_item * a = va; |
---|
150 | const struct dns_cache_item * b = vb; |
---|
151 | return strcmp( a->host, b->host ); |
---|
152 | } |
---|
153 | |
---|
/* Outcome of a DNS cache lookup. */
typedef enum
{
    TR_DNS_OK,       /* the cache holds a resolved address for the host */
    TR_DNS_FAIL,     /* the cache remembers a failed lookup for the host */
    TR_DNS_UNTESTED  /* no usable cache entry; a real lookup is needed */
}
tr_dns_result;
---|
161 | |
---|
162 | static void |
---|
163 | dns_cache_clear_entry( struct tr_ptrArray * cache, const char * host ) |
---|
164 | { |
---|
165 | struct dns_cache_item key; |
---|
166 | key.host = (char*) host; |
---|
167 | dns_cache_item_free( tr_ptrArrayRemoveSorted( cache, &key, dns_cache_compare ) ); |
---|
168 | } |
---|
169 | |
---|
170 | static tr_dns_result |
---|
171 | dns_cache_lookup( struct tr_web_task * task, const char * host, const char ** resolved ) |
---|
172 | { |
---|
173 | tr_dns_result result = TR_DNS_UNTESTED; |
---|
174 | |
---|
175 | if( task->session->web != NULL ) |
---|
176 | { |
---|
177 | struct dns_cache_item key; |
---|
178 | struct dns_cache_item * item; |
---|
179 | tr_ptrArray * cache = &task->session->web->dns_cache; |
---|
180 | |
---|
181 | key.host = (char*) host; |
---|
182 | item = tr_ptrArrayFindSorted( cache, &key, dns_cache_compare ); |
---|
183 | |
---|
184 | /* has the ttl expired? */ |
---|
185 | if( ( item != NULL ) && ( item->expiration <= tr_time( ) ) ) |
---|
186 | { |
---|
187 | dns_cache_clear_entry( cache, host ); |
---|
188 | item = NULL; |
---|
189 | } |
---|
190 | |
---|
191 | if( item != NULL ) |
---|
192 | { |
---|
193 | result = item->success ? TR_DNS_OK : TR_DNS_FAIL; |
---|
194 | |
---|
195 | if( result == TR_DNS_OK ) |
---|
196 | { |
---|
197 | *resolved = item->resolved_host; |
---|
198 | |
---|
199 | dbgmsg( "found cached dns entry for \"%s\": %s", host, *resolved ); |
---|
200 | } |
---|
201 | } |
---|
202 | } |
---|
203 | |
---|
204 | return result; |
---|
205 | } |
---|
206 | |
---|
207 | static void |
---|
208 | dns_cache_set_fail( struct tr_web_task * task, const char * host ) |
---|
209 | { |
---|
210 | if( task->session->web != NULL ) |
---|
211 | { |
---|
212 | struct dns_cache_item * item; |
---|
213 | tr_ptrArray * cache = &task->session->web->dns_cache; |
---|
214 | |
---|
215 | dns_cache_clear_entry( cache, host ); |
---|
216 | |
---|
217 | item = tr_new( struct dns_cache_item, 1 ); |
---|
218 | item->host = tr_strdup( host ); |
---|
219 | item->resolved_host = NULL; |
---|
220 | item->expiration = tr_time( ) + MIN_DNS_CACHE_TIME; |
---|
221 | item->success = FALSE; |
---|
222 | tr_ptrArrayInsertSorted( cache, item, dns_cache_compare ); |
---|
223 | } |
---|
224 | } |
---|
225 | |
---|
226 | static const char* |
---|
227 | dns_cache_set_name( struct tr_web_task * task, const char * host, |
---|
228 | const char * resolved, int ttl ) |
---|
229 | { |
---|
230 | char * ret = NULL; |
---|
231 | |
---|
232 | ttl = MAX( MIN_DNS_CACHE_TIME, ttl ); |
---|
233 | |
---|
234 | if( task->session->web != NULL ) |
---|
235 | { |
---|
236 | struct dns_cache_item * item; |
---|
237 | tr_ptrArray * cache = &task->session->web->dns_cache; |
---|
238 | |
---|
239 | dns_cache_clear_entry( cache, host ); |
---|
240 | |
---|
241 | item = tr_new( struct dns_cache_item, 1 ); |
---|
242 | item->host = tr_strdup( host ); |
---|
243 | item->resolved_host = tr_strdup( resolved ); |
---|
244 | item->expiration = tr_time( ) + ttl; |
---|
245 | item->success = TRUE; |
---|
246 | tr_ptrArrayInsertSorted( cache, item, dns_cache_compare ); |
---|
247 | ret = item->resolved_host; |
---|
248 | dbgmsg( "adding dns cache entry for \"%s\": %s", host, resolved ); |
---|
249 | } |
---|
250 | return ret; |
---|
251 | } |
---|
252 | |
---|
253 | /*** |
---|
254 | **** |
---|
255 | ***/ |
---|
256 | |
---|
257 | static size_t |
---|
258 | writeFunc( void * ptr, size_t size, size_t nmemb, void * vtask ) |
---|
259 | { |
---|
260 | const size_t byteCount = size * nmemb; |
---|
261 | struct tr_web_task * task = vtask; |
---|
262 | evbuffer_add( task->response, ptr, byteCount ); |
---|
263 | dbgmsg( "wrote %zu bytes to task %p's buffer", byteCount, task ); |
---|
264 | return byteCount; |
---|
265 | } |
---|
266 | |
---|
267 | static int |
---|
268 | sockoptfunction( void * vtask, curl_socket_t fd, curlsocktype purpose UNUSED ) |
---|
269 | { |
---|
270 | struct tr_web_task * task = vtask; |
---|
271 | const tr_bool isScrape = strstr( task->url, "scrape" ) != NULL; |
---|
272 | const tr_bool isAnnounce = strstr( task->url, "announce" ) != NULL; |
---|
273 | |
---|
274 | /* announce and scrape requests have tiny payloads. */ |
---|
275 | if( isScrape || isAnnounce ) |
---|
276 | { |
---|
277 | const int sndbuf = 1024; |
---|
278 | const int rcvbuf = isScrape ? 2048 : 3072; |
---|
279 | setsockopt( fd, SOL_SOCKET, SO_SNDBUF, &sndbuf, sizeof(sndbuf) ); |
---|
280 | setsockopt( fd, SOL_SOCKET, SO_RCVBUF, &rcvbuf, sizeof(rcvbuf) ); |
---|
281 | } |
---|
282 | |
---|
283 | /* return nonzero if this function encountered an error */ |
---|
284 | return 0; |
---|
285 | } |
---|
286 | |
---|
287 | static int |
---|
288 | getCurlProxyType( tr_proxy_type t ) |
---|
289 | { |
---|
290 | if( t == TR_PROXY_SOCKS4 ) return CURLPROXY_SOCKS4; |
---|
291 | if( t == TR_PROXY_SOCKS5 ) return CURLPROXY_SOCKS5; |
---|
292 | return CURLPROXY_HTTP; |
---|
293 | } |
---|
294 | |
---|
/**
 * Pick the timeout for a request from its URL: 30 for URLs that contain
 * "scrape", 120 for URLs that contain "announce", 240 for everything else.
 * "scrape" wins when both words are present.
 */
static int
getTimeoutFromURL( const char * url )
{
    int timeout = 240;

    if( strstr( url, "scrape" ) != NULL )
        timeout = 30;
    else if( strstr( url, "announce" ) != NULL )
        timeout = 120;

    return timeout;
}
---|
302 | |
---|
303 | static void task_timeout_cb( int fd UNUSED, short what UNUSED, void * task ); |
---|
304 | static void task_finish( struct tr_web_task * task, long response_code ); |
---|
305 | |
---|
306 | static void |
---|
307 | addTask( void * vtask ) |
---|
308 | { |
---|
309 | struct tr_web_task * task = vtask; |
---|
310 | const tr_session * session = task->session; |
---|
311 | |
---|
312 | if( ( session == NULL ) || ( session->web == NULL ) ) |
---|
313 | return; |
---|
314 | |
---|
315 | if( !task->resolved_host ) |
---|
316 | { |
---|
317 | dbgmsg( "couldn't resolve host for \"%s\"... task failed", task->url ); |
---|
318 | task_finish( task, 0 ); |
---|
319 | } |
---|
320 | else |
---|
321 | { |
---|
322 | CURL * e = curl_easy_init( ); |
---|
323 | struct tr_web * web = session->web; |
---|
324 | const int timeout = getTimeoutFromURL( task->url ); |
---|
325 | const long verbose = getenv( "TR_CURL_VERBOSE" ) != NULL; |
---|
326 | const char * user_agent = TR_NAME "/" SHORT_VERSION_STRING; |
---|
327 | |
---|
328 | /* insert the resolved host into the URL s.t. curl's DNS won't block |
---|
329 | * even if -- like on most OSes -- it wasn't built with C-Ares :( |
---|
330 | * "http://www.craptrackular.org/announce?key=val&key2=..." becomes |
---|
331 | * "http://127.0.0.1/announce?key=val&key2=..." */ |
---|
332 | { |
---|
333 | char * host; |
---|
334 | struct evbuffer * buf = evbuffer_new( ); |
---|
335 | char * pch = strstr( task->url, task->host ); |
---|
336 | char * tail = pch + strlen( task->host ); |
---|
337 | evbuffer_add( buf, task->url, pch - task->url ); |
---|
338 | evbuffer_add_printf( buf, "%s", task->resolved_host ); |
---|
339 | evbuffer_add_printf( buf, "%s", tail ); |
---|
340 | task->resolved_url = tr_strndup( EVBUFFER_DATA( buf ), EVBUFFER_LENGTH( buf ) ); |
---|
341 | dbgmsg( "old url: \"%s\" -- new url: \"%s\"", task->url, task->resolved_url ); |
---|
342 | evbuffer_free( buf ); |
---|
343 | |
---|
344 | /* Manually add a Host: argument that refers to the true URL */ |
---|
345 | if( ( ( task->port <= 0 ) ) || |
---|
346 | ( ( task->port == 80 ) && !strncmp( task->url, "http://", 7 ) ) || |
---|
347 | ( ( task->port == 443 ) && !strncmp( task->url, "https://", 8 ) ) ) |
---|
348 | host = tr_strdup_printf( "Host: %s", task->host ); |
---|
349 | else |
---|
350 | host = tr_strdup_printf( "Host: %s:%d", task->host, task->port ); |
---|
351 | |
---|
352 | task->slist = curl_slist_append( NULL, host ); |
---|
353 | task->slist = curl_slist_append( task->slist, "Accept:" ); |
---|
354 | curl_easy_setopt( e, CURLOPT_HTTPHEADER, task->slist ); |
---|
355 | tr_free( host ); |
---|
356 | } |
---|
357 | |
---|
358 | dbgmsg( "adding task #%lu [%s]", task->tag, task->resolved_url ? task->resolved_url : task->url ); |
---|
359 | |
---|
360 | if( !task->range && session->isProxyEnabled ) { |
---|
361 | curl_easy_setopt( e, CURLOPT_PROXY, session->proxy ); |
---|
362 | curl_easy_setopt( e, CURLOPT_PROXYAUTH, CURLAUTH_ANY ); |
---|
363 | curl_easy_setopt( e, CURLOPT_PROXYPORT, session->proxyPort ); |
---|
364 | curl_easy_setopt( e, CURLOPT_PROXYTYPE, |
---|
365 | getCurlProxyType( session->proxyType ) ); |
---|
366 | } |
---|
367 | if( !task->range && session->isProxyAuthEnabled ) { |
---|
368 | char * str = tr_strdup_printf( "%s:%s", session->proxyUsername, |
---|
369 | session->proxyPassword ); |
---|
370 | curl_easy_setopt( e, CURLOPT_PROXYUSERPWD, str ); |
---|
371 | tr_free( str ); |
---|
372 | } |
---|
373 | |
---|
374 | task->easy = e; |
---|
375 | task->multi = web->multi; |
---|
376 | |
---|
377 | /* use our own timeout instead of CURLOPT_TIMEOUT because the latter |
---|
378 | * doesn't play nicely with curl_multi. See curl bug #2501457 */ |
---|
379 | task->timer_event_isSet = TRUE; |
---|
380 | evtimer_set( &task->timer_event, task_timeout_cb, task ); |
---|
381 | tr_timerAdd( &task->timer_event, timeout, 0 ); |
---|
382 | |
---|
383 | curl_easy_setopt( e, CURLOPT_SOCKOPTFUNCTION, sockoptfunction ); |
---|
384 | curl_easy_setopt( e, CURLOPT_SOCKOPTDATA, task ); |
---|
385 | curl_easy_setopt( e, CURLOPT_WRITEDATA, task ); |
---|
386 | curl_easy_setopt( e, CURLOPT_WRITEFUNCTION, writeFunc ); |
---|
387 | curl_easy_setopt( e, CURLOPT_DNS_CACHE_TIMEOUT, MIN_DNS_CACHE_TIME ); |
---|
388 | curl_easy_setopt( e, CURLOPT_FOLLOWLOCATION, 1L ); |
---|
389 | curl_easy_setopt( e, CURLOPT_AUTOREFERER, 1L ); |
---|
390 | curl_easy_setopt( e, CURLOPT_PRIVATE, task ); |
---|
391 | curl_easy_setopt( e, CURLOPT_SSL_VERIFYHOST, 0L ); |
---|
392 | curl_easy_setopt( e, CURLOPT_SSL_VERIFYPEER, 0L ); |
---|
393 | curl_easy_setopt( e, CURLOPT_URL, task->resolved_url ? task->resolved_url : task->url ); |
---|
394 | curl_easy_setopt( e, CURLOPT_USERAGENT, user_agent ); |
---|
395 | curl_easy_setopt( e, CURLOPT_VERBOSE, verbose ); |
---|
396 | if( web->haveAddr ) |
---|
397 | curl_easy_setopt( e, CURLOPT_INTERFACE, tr_ntop_non_ts( &web->addr ) ); |
---|
398 | if( task->range ) |
---|
399 | curl_easy_setopt( e, CURLOPT_RANGE, task->range ); |
---|
400 | |
---|
401 | if( curl_multi_add_handle( web->multi, e ) == CURLM_OK ) |
---|
402 | ++web->taskCount; |
---|
403 | } |
---|
404 | } |
---|
405 | |
---|
406 | static void |
---|
407 | dns_ipv6_done_cb( int err, char type, int count, int ttl, void * addresses, void * vtask ) |
---|
408 | { |
---|
409 | struct tr_web_task * task = vtask; |
---|
410 | |
---|
411 | if( !err && task->host && ( count>0 ) && ( ttl>=0 ) && ( type==DNS_IPv6_AAAA ) ) |
---|
412 | { |
---|
413 | int i; |
---|
414 | char buf[INET6_ADDRSTRLEN+1]; |
---|
415 | struct in6_addr *in6_addrs = addresses; |
---|
416 | |
---|
417 | for( i=0; i<count; ++i ) { |
---|
418 | const char * b = inet_ntop(AF_INET6, &in6_addrs[i], buf,sizeof(buf)); |
---|
419 | if( b != NULL ) { |
---|
420 | /* FIXME: is there a better way to tell which one to use if count > 1? */ |
---|
421 | task->resolved_host = dns_cache_set_name( task, task->host, b, ttl ); |
---|
422 | break; |
---|
423 | } |
---|
424 | } |
---|
425 | } |
---|
426 | |
---|
427 | if( task->resolved_host == NULL ) |
---|
428 | dns_cache_set_fail( task, task->host ); |
---|
429 | |
---|
430 | addTask( task ); |
---|
431 | } |
---|
432 | |
---|
433 | static void |
---|
434 | dns_ipv4_done_cb( int err, char type, int count, int ttl, void * addresses, void * vtask ) |
---|
435 | { |
---|
436 | struct tr_web_task * task = vtask; |
---|
437 | |
---|
438 | if( !err && task->host && ( count>0 ) && ( ttl>=0 ) && ( type==DNS_IPv4_A ) ) |
---|
439 | { |
---|
440 | struct in_addr * in_addrs = addresses; |
---|
441 | const char * resolved = inet_ntoa( in_addrs[0] ); |
---|
442 | task->resolved_host = dns_cache_set_name( task, task->host, resolved, ttl ); |
---|
443 | /* FIXME: if count > 1, is there a way to decide which is best to use? */ |
---|
444 | } |
---|
445 | |
---|
446 | if( ( task->resolved_host != NULL ) |
---|
447 | || ( task->host == NULL ) |
---|
448 | || evdns_resolve_ipv6( task->host, 0, dns_ipv6_done_cb, task ) ) |
---|
449 | dns_ipv6_done_cb( DNS_ERR_UNKNOWN, DNS_IPv6_AAAA, 0, 0, NULL, task ); |
---|
450 | } |
---|
451 | |
---|
452 | static void |
---|
453 | doDNS( void * vtask ) |
---|
454 | { |
---|
455 | tr_address addr; |
---|
456 | int port = -1; |
---|
457 | char * host = NULL; |
---|
458 | struct tr_web_task * task = vtask; |
---|
459 | tr_dns_result lookup_result = TR_DNS_UNTESTED; |
---|
460 | |
---|
461 | assert( task->resolved_host == NULL ); |
---|
462 | |
---|
463 | if( !tr_httpParseURL( task->url, -1, &host, &port, NULL ) ) |
---|
464 | { |
---|
465 | task->port = port; |
---|
466 | task->host = host; |
---|
467 | |
---|
468 | /* If 'host' is an IPv4 or IPv6 address in text form, use it as-is. |
---|
469 | * Otherwise, see if its resolved name is in our DNS cache */ |
---|
470 | if( tr_pton( task->host, &addr ) != NULL ) |
---|
471 | { |
---|
472 | task->resolved_host = task->host; |
---|
473 | lookup_result = TR_DNS_OK; |
---|
474 | } |
---|
475 | else |
---|
476 | { |
---|
477 | lookup_result = dns_cache_lookup( task, host, &task->resolved_host ); |
---|
478 | } |
---|
479 | } |
---|
480 | |
---|
481 | if( lookup_result != TR_DNS_UNTESTED ) |
---|
482 | { |
---|
483 | addTask( task ); |
---|
484 | } |
---|
485 | else if( !host || evdns_resolve_ipv4( host, 0, dns_ipv4_done_cb, task ) ) |
---|
486 | { |
---|
487 | dns_ipv4_done_cb( DNS_ERR_UNKNOWN, DNS_IPv4_A, 0, 0, NULL, task ); |
---|
488 | } |
---|
489 | } |
---|
490 | |
---|
491 | /*** |
---|
492 | **** |
---|
493 | ***/ |
---|
494 | |
---|
495 | static void |
---|
496 | task_finish( struct tr_web_task * task, long response_code ) |
---|
497 | { |
---|
498 | dbgmsg( "finished web task %lu; got %ld", task->tag, response_code ); |
---|
499 | |
---|
500 | if( task->done_func != NULL ) |
---|
501 | task->done_func( task->session, |
---|
502 | response_code, |
---|
503 | EVBUFFER_DATA( task->response ), |
---|
504 | EVBUFFER_LENGTH( task->response ), |
---|
505 | task->done_func_user_data ); |
---|
506 | task_free( task ); |
---|
507 | } |
---|
508 | |
---|
509 | static void |
---|
510 | remove_task( struct tr_web_task * task ) |
---|
511 | { |
---|
512 | long code; |
---|
513 | |
---|
514 | curl_easy_getinfo( task->easy, CURLINFO_RESPONSE_CODE, &code ); |
---|
515 | curl_multi_remove_handle( task->multi, task->easy ); |
---|
516 | curl_easy_cleanup( task->easy ); |
---|
517 | task_finish( task, code ); |
---|
518 | } |
---|
519 | |
---|
520 | static void |
---|
521 | task_timeout_cb( int fd UNUSED, short what UNUSED, void * task ) |
---|
522 | { |
---|
523 | remove_task( task ); |
---|
524 | } |
---|
525 | |
---|
526 | static void |
---|
527 | remove_finished_tasks( tr_web * g ) |
---|
528 | { |
---|
529 | CURLMsg * msg; |
---|
530 | int msgs_left; |
---|
531 | |
---|
532 | while(( msg = curl_multi_info_read( g->multi, &msgs_left ))) { |
---|
533 | if(( msg->msg == CURLMSG_DONE ) && ( msg->easy_handle != NULL )) { |
---|
534 | struct tr_web_task * task; |
---|
535 | CURL * e = msg->easy_handle; |
---|
536 | curl_easy_getinfo( e, CURLINFO_PRIVATE, (void*)&task ); |
---|
537 | assert( e == task->easy ); |
---|
538 | remove_task( task ); |
---|
539 | } |
---|
540 | } |
---|
541 | } |
---|
542 | |
---|
543 | static void |
---|
544 | restart_timer( tr_web * g ) |
---|
545 | { |
---|
546 | dbgmsg( "adding a timeout for %.1f seconds from now", g->timer_msec/1000.0 ); |
---|
547 | evtimer_del( &g->timer_event ); |
---|
548 | tr_timerAddMsec( &g->timer_event, g->timer_msec ); |
---|
549 | } |
---|
550 | |
---|
551 | static void |
---|
552 | tr_multi_perform( tr_web * g, int fd, int curl_what ) |
---|
553 | { |
---|
554 | CURLMcode m; |
---|
555 | |
---|
556 | dbgmsg( "check_run_count: %d taskCount", g->taskCount ); |
---|
557 | |
---|
558 | /* invoke libcurl's processing */ |
---|
559 | do |
---|
560 | m = curl_multi_socket_action( g->multi, fd, curl_what, &g->taskCount ); |
---|
561 | while( m == CURLM_CALL_MULTI_SOCKET ); |
---|
562 | |
---|
563 | remove_finished_tasks( g ); |
---|
564 | |
---|
565 | if( g->closing && !g->taskCount ) |
---|
566 | web_free( g ); |
---|
567 | else |
---|
568 | restart_timer( g ); |
---|
569 | } |
---|
570 | |
---|
571 | /* libevent says that sock is ready to be processed, so wake up libcurl */ |
---|
572 | static void |
---|
573 | event_cb( int fd, short ev_what, void * g ) |
---|
574 | { |
---|
575 | int curl_what = 0; |
---|
576 | if( ev_what & EV_READ ) curl_what |= CURL_POLL_IN; |
---|
577 | if( ev_what & EV_WRITE ) curl_what |= CURL_POLL_OUT; |
---|
578 | tr_multi_perform( g, fd, curl_what ); |
---|
579 | } |
---|
580 | |
---|
581 | /* CURLMOPT_SOCKETFUNCTION */ |
---|
582 | static int |
---|
583 | sock_cb( CURL * e UNUSED, curl_socket_t fd, int curl_what, |
---|
584 | void * vweb, void * vevent ) |
---|
585 | { |
---|
586 | /*static int num_events = 0;*/ |
---|
587 | struct tr_web * web = vweb; |
---|
588 | struct event * io_event = vevent; |
---|
589 | dbgmsg( "sock_cb: curl_what %d, fd %d, io_event %p", |
---|
590 | curl_what, (int)fd, io_event ); |
---|
591 | |
---|
592 | if( io_event != NULL ) |
---|
593 | event_del( io_event ); |
---|
594 | |
---|
595 | if( curl_what & ( CURL_POLL_IN | CURL_POLL_OUT ) ) |
---|
596 | { |
---|
597 | const short ev_what = EV_PERSIST |
---|
598 | | (( curl_what & CURL_POLL_IN ) ? EV_READ : 0 ) |
---|
599 | | (( curl_what & CURL_POLL_OUT ) ? EV_WRITE : 0 ); |
---|
600 | |
---|
601 | if( io_event == NULL ) { |
---|
602 | io_event = tr_new0( struct event, 1 ); |
---|
603 | curl_multi_assign( web->multi, fd, io_event ); |
---|
604 | /*fprintf( stderr, "+1 io_events to %d\n", ++num_events );*/ |
---|
605 | } |
---|
606 | |
---|
607 | dbgmsg( "enabling (libevent %hd, libcurl %d) on io_event %p, fd %d", |
---|
608 | ev_what, curl_what, io_event, fd ); |
---|
609 | event_set( io_event, fd, ev_what, event_cb, web ); |
---|
610 | assert( io_event->ev_base != NULL ); |
---|
611 | event_add( io_event, NULL ); |
---|
612 | } |
---|
613 | |
---|
614 | if( ( io_event != NULL ) && ( curl_what & CURL_POLL_REMOVE ) ) |
---|
615 | { |
---|
616 | memset( io_event, TR_MEMORY_TRASH, sizeof( struct event ) ); |
---|
617 | tr_free( io_event ); |
---|
618 | /*fprintf( stderr, "-1 io_events to %d\n", --num_events );*/ |
---|
619 | } |
---|
620 | |
---|
621 | return 0; /* libcurl documentation: "The callback MUST return 0." */ |
---|
622 | } |
---|
623 | |
---|
624 | /* libevent says that timer_msec have passed, so wake up libcurl */ |
---|
625 | static void |
---|
626 | libevent_timer_cb( int fd UNUSED, short what UNUSED, void * g ) |
---|
627 | { |
---|
628 | dbgmsg( "libevent timer is done" ); |
---|
629 | tr_multi_perform( g, CURL_SOCKET_TIMEOUT, 0 ); |
---|
630 | } |
---|
631 | |
---|
632 | /* libcurl documentation: "If 0, it means you should proceed immediately |
---|
633 | * without waiting for anything. If it returns -1, there's no timeout at all |
---|
634 | * set ... (but) you must not wait too long (more than a few seconds perhaps) |
---|
635 | * before you call curl_multi_perform() again." */ |
---|
636 | static void |
---|
637 | multi_timer_cb( CURLM * multi UNUSED, long timer_msec, void * vg ) |
---|
638 | { |
---|
639 | tr_web * g = vg; |
---|
640 | |
---|
641 | g->timer_msec = timer_msec > 0 ? timer_msec : DEFAULT_TIMER_MSEC; |
---|
642 | |
---|
643 | if( timer_msec < 1 ) |
---|
644 | tr_multi_perform( g, CURL_SOCKET_TIMEOUT, 0 ); |
---|
645 | else |
---|
646 | restart_timer( g ); |
---|
647 | } |
---|
648 | |
---|
649 | /**** |
---|
650 | ***** |
---|
651 | ****/ |
---|
652 | |
---|
653 | void |
---|
654 | tr_webRun( tr_session * session, |
---|
655 | const char * url, |
---|
656 | const char * range, |
---|
657 | tr_web_done_func done_func, |
---|
658 | void * done_func_user_data ) |
---|
659 | { |
---|
660 | if( session->web != NULL ) |
---|
661 | { |
---|
662 | static unsigned long tag = 0; |
---|
663 | struct tr_web_task * task = tr_new0( struct tr_web_task, 1 ); |
---|
664 | task->session = session; |
---|
665 | task->url = tr_strdup( url ); |
---|
666 | task->range = tr_strdup( range ); |
---|
667 | task->done_func = done_func; |
---|
668 | task->done_func_user_data = done_func_user_data; |
---|
669 | task->tag = ++tag; |
---|
670 | task->response = evbuffer_new( ); |
---|
671 | tr_runInEventThread( session, doDNS, task ); |
---|
672 | } |
---|
673 | } |
---|
674 | |
---|
675 | void |
---|
676 | tr_webSetInterface( tr_web * web, const tr_address * addr ) |
---|
677 | { |
---|
678 | if(( web->haveAddr = ( addr != NULL ))) |
---|
679 | web->addr = *addr; |
---|
680 | } |
---|
681 | |
---|
682 | tr_web* |
---|
683 | tr_webInit( tr_session * session ) |
---|
684 | { |
---|
685 | tr_web * web; |
---|
686 | |
---|
687 | /* try to enable ssl for https support; but if that fails, |
---|
688 | * try a plain vanilla init */ |
---|
689 | if( curl_global_init( CURL_GLOBAL_SSL ) ) |
---|
690 | curl_global_init( 0 ); |
---|
691 | |
---|
692 | web = tr_new0( struct tr_web, 1 ); |
---|
693 | web->dns_cache = TR_PTR_ARRAY_INIT; |
---|
694 | web->session = session; |
---|
695 | web->timer_msec = DEFAULT_TIMER_MSEC; /* overwritten by multi_timer_cb() */ |
---|
696 | evtimer_set( &web->timer_event, libevent_timer_cb, web ); |
---|
697 | |
---|
698 | web->multi = curl_multi_init( ); |
---|
699 | |
---|
700 | evdns_init( ); |
---|
701 | |
---|
702 | curl_multi_setopt( web->multi, CURLMOPT_SOCKETDATA, web ); |
---|
703 | curl_multi_setopt( web->multi, CURLMOPT_SOCKETFUNCTION, sock_cb ); |
---|
704 | curl_multi_setopt( web->multi, CURLMOPT_TIMERDATA, web ); |
---|
705 | curl_multi_setopt( web->multi, CURLMOPT_TIMERFUNCTION, multi_timer_cb ); |
---|
706 | |
---|
707 | return web; |
---|
708 | } |
---|
709 | |
---|
710 | void |
---|
711 | tr_webClose( tr_web ** web_in ) |
---|
712 | { |
---|
713 | tr_web * web = *web_in; |
---|
714 | *web_in = NULL; |
---|
715 | if( web->taskCount < 1 ) |
---|
716 | web_free( web ); |
---|
717 | else |
---|
718 | web->closing = 1; |
---|
719 | } |
---|
720 | |
---|
721 | /***** |
---|
722 | ****** |
---|
723 | ****** |
---|
724 | *****/ |
---|
725 | |
---|
/**
 * Return the standard reason phrase for an HTTP response code.
 *
 * @param code an HTTP status code, or 0 when no response was received
 * @return a static string; "Unknown Error" for codes not listed here
 */
const char *
tr_webGetResponseStr( long code )
{
    switch( code )
    {
        case   0: return "No Response";
        case 100: return "Continue";
        case 101: return "Switching Protocols";
        case 200: return "OK";
        case 201: return "Created";
        case 202: return "Accepted";
        case 203: return "Non-Authoritative Information";
        case 204: return "No Content";
        case 205: return "Reset Content";
        case 206: return "Partial Content";
        case 300: return "Multiple Choices";
        case 301: return "Moved Permanently";
        case 302: return "Found";
        case 303: return "See Other";
        case 304: return "Not Modified";
        case 305: return "Use Proxy";
        case 306: return "(Unused)";
        case 307: return "Temporary Redirect";
        case 400: return "Bad Request";
        case 401: return "Unauthorized";
        case 402: return "Payment Required";
        case 403: return "Forbidden";
        case 404: return "Not Found";
        case 405: return "Method Not Allowed";
        case 406: return "Not Acceptable";
        case 407: return "Proxy Authentication Required";
        case 408: return "Request Timeout";
        case 409: return "Conflict";
        case 410: return "Gone";
        case 411: return "Length Required";
        case 412: return "Precondition Failed";
        case 413: return "Request Entity Too Large";
        case 414: return "Request-URI Too Long";
        case 415: return "Unsupported Media Type";
        case 416: return "Requested Range Not Satisfiable";
        case 417: return "Expectation Failed";
        case 500: return "Internal Server Error";
        case 501: return "Not Implemented";
        case 502: return "Bad Gateway";
        case 503: return "Service Unavailable";
        case 504: return "Gateway Timeout";
        case 505: return "HTTP Version Not Supported";
        default:  return "Unknown Error";
    }
}
---|
775 | |
---|
776 | void |
---|
777 | tr_http_escape( struct evbuffer * out, |
---|
778 | const char * str, int len, tr_bool escape_slashes ) |
---|
779 | { |
---|
780 | int i; |
---|
781 | |
---|
782 | if( ( len < 0 ) && ( str != NULL ) ) |
---|
783 | len = strlen( str ); |
---|
784 | |
---|
785 | for( i = 0; i < len; i++ ) { |
---|
786 | if( str[i] == ',' || str[i] == '-' || str[i] == '.' |
---|
787 | || ( '0' <= str[i] && str[i] <= '9' ) |
---|
788 | || ( 'A' <= str[i] && str[i] <= 'Z' ) |
---|
789 | || ( 'a' <= str[i] && str[i] <= 'z' ) |
---|
790 | || ( str[i] == '/' && !escape_slashes ) ) |
---|
791 | evbuffer_add( out, &str[i], 1 ); |
---|
792 | else |
---|
793 | evbuffer_add_printf( out, "%%%02X", (unsigned)(str[i]&0xFF) ); |
---|
794 | } |
---|
795 | } |
---|
796 | |
---|
/**
 * Decode a percent-encoded string with libcurl.
 *
 * @return a copy of the decoded text made with tr_strdup(); the
 *         intermediate buffer allocated by libcurl is released here
 */
char *
tr_http_unescape( const char * str, int len )
{
    char * decoded = curl_unescape( str, len );
    char * copy = tr_strdup( decoded );

    curl_free( decoded );

    return copy;
}
---|