1 |
|
/* ============================================================================ |
2 |
|
* Douglas Thrift's Search Engine License |
3 |
|
* |
4 |
< |
* Copyright (C) 2002, Douglas Thrift. All Rights Reserved. |
4 |
> |
* Copyright (C) 2002-2003, Douglas Thrift. All Rights Reserved. |
5 |
|
* Redistribution and use in source and binary forms, with or without |
6 |
|
* modification, are permitted provided that the following conditions are met: |
7 |
|
* |
46 |
|
// |
47 |
|
// Douglas Thrift |
48 |
|
// |
49 |
< |
// HttpHandler.cpp |
49 |
> |
// $Id: HttpHandler.cpp,v 1.19 2003/07/15 08:01:00 douglas Exp $ |
50 |
|
|
51 |
|
#include "HttpHandler.h" |
52 |
|
|
53 |
+ |
// Lovely C Sockets! |
54 |
+ |
#ifndef _WIN32 |
55 |
+ |
// BSD Sockets |
56 |
+ |
#include <unistd.h> |
57 |
+ |
#include <sys/types.h> |
58 |
+ |
#include <sys/socket.h> |
59 |
+ |
#include <netinet/in.h> |
60 |
+ |
#include <netdb.h> |
61 |
+ |
|
62 |
+ |
#define INVALID_SOCKET -1 |
63 |
+ |
#define SOCKET_ERROR -1 |
64 |
+ |
|
65 |
+ |
inline int closesocket(SOCKET s) { return close(s); } |
66 |
+ |
#endif |
67 |
+ |
|
68 |
|
HttpHandler::HttpHandler() |
69 |
|
{ |
70 |
|
buffer = new char[BUFSIZ + 1]; |
79 |
|
|
80 |
|
length = 0; |
81 |
|
chunked = false; |
82 |
+ |
#ifdef _OpenSSL_ |
83 |
+ |
tls = false; |
84 |
+ |
#endif |
85 |
|
} |
86 |
|
|
87 |
|
HttpHandler::~HttpHandler() |
134 |
|
} |
135 |
|
|
136 |
|
putline("Accept: text/html; text/plain"); |
137 |
+ |
#ifndef _OpenSSL_ |
138 |
|
putline("User-Agent: " + agent(true) + ' ' + platform()); |
139 |
+ |
#else |
140 |
+ |
putline("User-Agent: " + agent(true) + ' ' + platform() + ' ' |
141 |
+ |
+ openssl(true)); |
142 |
+ |
#endif |
143 |
|
|
144 |
|
if (url.getPort() == 80) |
145 |
|
{ |
289 |
|
location = ""; |
290 |
|
page = ""; |
291 |
|
chunked = false; |
292 |
+ |
#ifdef _OpenSSL_ |
293 |
+ |
tls = false; |
294 |
+ |
#endif |
295 |
|
} |
296 |
|
|
297 |
|
void HttpHandler::populate() |
307 |
|
unsigned bytes = left > BUFSIZ ? BUFSIZ : left; |
308 |
|
unsigned received; |
309 |
|
|
310 |
< |
if ((received = recv(http, buffer, bytes, 0)) == SOCKET_ERROR) |
285 |
< |
{ |
286 |
< |
error(program + ": Recv"); |
287 |
< |
exit(1); |
288 |
< |
} |
289 |
< |
else if (received != bytes) |
310 |
> |
while (true) |
311 |
|
{ |
312 |
< |
left -= received; |
292 |
< |
page += buffer; |
293 |
< |
|
294 |
< |
memset(buffer, 0, BUFSIZ + 1); |
295 |
< |
|
296 |
< |
bytes -= received; |
297 |
< |
if (recv(http, buffer, bytes, 0) == SOCKET_ERROR) |
312 |
> |
if ((received = recv(http, buffer, bytes, 0)) == SOCKET_ERROR) |
313 |
|
{ |
314 |
|
error(program + ": Recv"); |
315 |
|
exit(1); |
316 |
|
} |
317 |
+ |
else if (received != bytes) |
318 |
+ |
{ |
319 |
+ |
left -= received; |
320 |
+ |
page += buffer; |
321 |
+ |
|
322 |
+ |
memset(buffer, 0, BUFSIZ + 1); |
323 |
+ |
|
324 |
+ |
bytes -= received; |
325 |
+ |
} |
326 |
+ |
else |
327 |
+ |
{ |
328 |
+ |
break; |
329 |
+ |
} |
330 |
|
} |
331 |
|
|
332 |
|
page += buffer; |
350 |
|
unsigned bytes = left > BUFSIZ ? BUFSIZ : left; |
351 |
|
unsigned received; |
352 |
|
|
353 |
< |
if ((received = recv(http, buffer, bytes, 0)) == SOCKET_ERROR) |
326 |
< |
{ |
327 |
< |
error(program + ": Recv"); |
328 |
< |
exit(1); |
329 |
< |
} |
330 |
< |
else if (received != bytes) |
353 |
> |
while (true) |
354 |
|
{ |
355 |
< |
left -= received; |
356 |
< |
page += buffer; |
334 |
< |
|
335 |
< |
memset(buffer, 0, BUFSIZ + 1); |
336 |
< |
|
337 |
< |
bytes -= received; |
338 |
< |
if (recv(http, buffer, bytes, 0) == SOCKET_ERROR) |
355 |
> |
if ((received = recv(http, buffer, bytes, 0)) == |
356 |
> |
SOCKET_ERROR) |
357 |
|
{ |
358 |
|
error(program + ": Recv"); |
359 |
|
exit(1); |
360 |
|
} |
361 |
+ |
else if (received != bytes) |
362 |
+ |
{ |
363 |
+ |
left -= received; |
364 |
+ |
page += buffer; |
365 |
+ |
|
366 |
+ |
memset(buffer, 0, BUFSIZ + 1); |
367 |
+ |
|
368 |
+ |
bytes -= received; |
369 |
+ |
} |
370 |
+ |
else |
371 |
+ |
{ |
372 |
+ |
break; |
373 |
+ |
} |
374 |
|
} |
375 |
|
|
376 |
|
page += buffer; |
437 |
|
switch (WSAGetLastError()) |
438 |
|
{ |
439 |
|
case WSAEACCES: |
440 |
< |
error = "Permission denied."; |
440 |
> |
error = "Permission denied"; |
441 |
|
break; |
442 |
|
case WSAEADDRINUSE: |
443 |
< |
error = "Address already in use."; |
443 |
> |
error = "Address already in use"; |
444 |
|
break; |
445 |
|
case WSAEADDRNOTAVAIL: |
446 |
< |
error = "Cannot assign requested address."; |
446 |
> |
error = "Cannot assign requested address"; |
447 |
|
break; |
448 |
|
case WSAEAFNOSUPPORT: |
449 |
< |
error = "Address family not supported by protocol family."; |
449 |
> |
error = "Address family not supported by protocol family"; |
450 |
|
break; |
451 |
|
case WSAEALREADY: |
452 |
< |
error = "Operation already in progress."; |
452 |
> |
error = "Operation already in progress"; |
453 |
|
break; |
454 |
|
case WSAECONNABORTED: |
455 |
< |
error = "Software caused connection abort."; |
455 |
> |
error = "Software caused connection abort"; |
456 |
|
break; |
457 |
|
case WSAECONNREFUSED: |
458 |
< |
error = "Connection refused."; |
458 |
> |
error = "Connection refused"; |
459 |
|
break; |
460 |
|
case WSAECONNRESET: |
461 |
< |
error = "Connection reset by peer."; |
461 |
> |
error = "Connection reset by peer"; |
462 |
|
break; |
463 |
|
case WSAEDESTADDRREQ: |
464 |
< |
error = "Destination address required."; |
464 |
> |
error = "Destination address required"; |
465 |
|
break; |
466 |
|
case WSAEFAULT: |
467 |
< |
error = "Bad address."; |
467 |
> |
error = "Bad address"; |
468 |
|
break; |
469 |
|
case WSAEHOSTDOWN: |
470 |
< |
error = "Host is down."; |
470 |
> |
error = "Host is down"; |
471 |
|
break; |
472 |
|
case WSAEHOSTUNREACH: |
473 |
< |
error = "No route to host."; |
473 |
> |
error = "No route to host"; |
474 |
|
break; |
475 |
|
case WSAEINPROGRESS: |
476 |
< |
error = "Operation now in progress."; |
476 |
> |
error = "Operation now in progress"; |
477 |
|
break; |
478 |
|
case WSAEINTR: |
479 |
< |
error = "Interrupted function call."; |
479 |
> |
error = "Interrupted function call"; |
480 |
|
break; |
481 |
|
case WSAEINVAL: |
482 |
< |
error = "Invalid argument."; |
482 |
> |
error = "Invalid argument"; |
483 |
|
break; |
484 |
|
case WSAEISCONN: |
485 |
< |
error = "Socket is already connected."; |
485 |
> |
error = "Socket is already connected"; |
486 |
|
break; |
487 |
|
case WSAEMFILE: |
488 |
< |
error = "Too many open files."; |
488 |
> |
error = "Too many open files"; |
489 |
|
break; |
490 |
|
case WSAEMSGSIZE: |
491 |
< |
error = "Message too long."; |
491 |
> |
error = "Message too long"; |
492 |
|
break; |
493 |
|
case WSAENETDOWN: |
494 |
< |
error = "Network is down."; |
494 |
> |
error = "Network is down"; |
495 |
|
break; |
496 |
|
case WSAENETRESET: |
497 |
< |
error = "Network dropped connection on reset."; |
497 |
> |
error = "Network dropped connection on reset"; |
498 |
|
break; |
499 |
|
case WSAENETUNREACH: |
500 |
< |
error = "Network is unreachable."; |
500 |
> |
error = "Network is unreachable"; |
501 |
|
break; |
502 |
|
case WSAENOBUFS: |
503 |
< |
error = "No buffer space available."; |
503 |
> |
error = "No buffer space available"; |
504 |
|
break; |
505 |
|
case WSAENOPROTOOPT: |
506 |
< |
error = "Bad protocol option."; |
506 |
> |
error = "Bad protocol option"; |
507 |
|
break; |
508 |
|
case WSAENOTCONN: |
509 |
< |
error = "Socket is not connected."; |
509 |
> |
error = "Socket is not connected"; |
510 |
|
break; |
511 |
|
case WSAENOTSOCK: |
512 |
< |
error = "Socket operation on non-socket."; |
512 |
> |
error = "Socket operation on non-socket"; |
513 |
|
break; |
514 |
|
case WSAEOPNOTSUPP: |
515 |
< |
error = "Operation not supported."; |
515 |
> |
error = "Operation not supported"; |
516 |
|
break; |
517 |
|
case WSAEPFNOSUPPORT: |
518 |
< |
error = "Protocol family not supported."; |
518 |
> |
error = "Protocol family not supported"; |
519 |
|
break; |
520 |
|
case WSAEPROCLIM: |
521 |
< |
error = "Too many processes."; |
521 |
> |
error = "Too many processes"; |
522 |
|
break; |
523 |
|
case WSAEPROTONOSUPPORT: |
524 |
< |
error = "Protocol not supported."; |
524 |
> |
error = "Protocol not supported"; |
525 |
|
break; |
526 |
|
case WSAEPROTOTYPE: |
527 |
< |
error = "Protocol wrong type for socket."; |
527 |
> |
error = "Protocol wrong type for socket"; |
528 |
|
break; |
529 |
|
case WSAESHUTDOWN: |
530 |
< |
error = "Cannot send after socket shutdown."; |
530 |
> |
error = "Cannot send after socket shutdown"; |
531 |
|
break; |
532 |
|
case WSAESOCKTNOSUPPORT: |
533 |
< |
error = "Socket type not supported."; |
533 |
> |
error = "Socket type not supported"; |
534 |
|
break; |
535 |
|
case WSAETIMEDOUT: |
536 |
< |
error = "Connection timed out."; |
536 |
> |
error = "Connection timed out"; |
537 |
|
break; |
538 |
|
case WSATYPE_NOT_FOUND: |
539 |
< |
error = "Class type not found."; |
539 |
> |
error = "Class type not found"; |
540 |
|
break; |
541 |
|
case WSAEWOULDBLOCK: |
542 |
< |
error = "Resource temporarily unavailable."; |
542 |
> |
error = "Resource temporarily unavailable"; |
543 |
|
break; |
544 |
|
case WSAHOST_NOT_FOUND: |
545 |
< |
error = "Host not found."; |
545 |
> |
error = "Host not found"; |
546 |
|
break; |
547 |
|
case WSA_INVALID_HANDLE: |
548 |
< |
error = "Specified event object handle is invalid."; |
548 |
> |
error = "Specified event object handle is invalid"; |
549 |
|
break; |
550 |
|
case WSA_INVALID_PARAMETER: |
551 |
< |
error = "One or more parameters are invalid."; |
551 |
> |
error = "One or more parameters are invalid"; |
552 |
|
break; |
553 |
|
// case WSAINVALIDPROCTABLE: |
554 |
< |
// error = "Invalid procedure table from service provider."; |
554 |
> |
// error = "Invalid procedure table from service provider"; |
555 |
|
// break; |
556 |
|
// case WSAINVALIDPROVIDER: |
557 |
< |
// error = "Invalid service provider version number."; |
557 |
> |
// error = "Invalid service provider version number"; |
558 |
|
// break; |
559 |
|
case WSA_IO_INCOMPLETE: |
560 |
< |
error = "Overlapped I/O event object not in signaled state."; |
560 |
> |
error = "Overlapped I/O event object not in signaled state"; |
561 |
|
break; |
562 |
|
case WSA_IO_PENDING: |
563 |
< |
error = "Overlapped operations will complete later."; |
563 |
> |
error = "Overlapped operations will complete later"; |
564 |
|
break; |
565 |
|
case WSA_NOT_ENOUGH_MEMORY: |
566 |
< |
error = "Insufficient memory available."; |
566 |
> |
error = "Insufficient memory available"; |
567 |
|
break; |
568 |
|
case WSANOTINITIALISED: |
569 |
< |
error = "Successful WSAStartup not yet performed."; |
569 |
> |
error = "Successful WSAStartup not yet performed"; |
570 |
|
break; |
571 |
|
case WSANO_DATA: |
572 |
< |
error = "Valid name, no data record of requested type."; |
572 |
> |
error = "Valid name, no data record of requested type"; |
573 |
|
break; |
574 |
|
case WSANO_RECOVERY: |
575 |
< |
error = "This is a non-recoverable error."; |
575 |
> |
error = "This is a non-recoverable error"; |
576 |
|
break; |
577 |
|
// case WSAPROVIDERFAILEDINIT: |
578 |
< |
// error = "Unable to initialize a service provider."; |
578 |
> |
// error = "Unable to initialize a service provider"; |
579 |
|
// break; |
580 |
|
case WSASYSCALLFAILURE: |
581 |
< |
error = "System call failure."; |
581 |
> |
error = "System call failure"; |
582 |
|
break; |
583 |
|
case WSASYSNOTREADY: |
584 |
< |
error = "Network subsystem is unavailable."; |
584 |
> |
error = "Network subsystem is unavailable"; |
585 |
|
break; |
586 |
|
case WSATRY_AGAIN: |
587 |
< |
error = "Non-authoritative host not found."; |
587 |
> |
error = "Non-authoritative host not found"; |
588 |
|
break; |
589 |
|
case WSAVERNOTSUPPORTED: |
590 |
< |
error = "WINSOCK.DLL version out of range."; |
590 |
> |
error = "WINSOCK.DLL version out of range"; |
591 |
|
break; |
592 |
|
case WSAEDISCON: |
593 |
< |
error = "Graceful shutdown in progress."; |
593 |
> |
error = "Graceful shutdown in progress"; |
594 |
|
break; |
595 |
|
case WSA_OPERATION_ABORTED: |
596 |
< |
error = "Overlapped operation aborted."; |
596 |
> |
error = "Overlapped operation aborted"; |
597 |
|
break; |
598 |
|
default: |
599 |
< |
error = "Unknown error."; |
599 |
> |
error = "Unknown error"; |
600 |
|
break; |
601 |
|
} |
602 |
|
|
604 |
|
#else |
605 |
|
if (host) |
606 |
|
{ |
607 |
< |
herror(prefix.c_str()); |
607 |
> |
string error; |
608 |
> |
|
609 |
> |
switch (h_errno) |
610 |
> |
{ |
611 |
> |
case HOST_NOT_FOUND: |
612 |
> |
error = "Unknown host"; |
613 |
> |
break; |
614 |
> |
case TRY_AGAIN: |
615 |
> |
error = "Host name lookup failure"; |
616 |
> |
break; |
617 |
> |
case NO_RECOVERY: |
618 |
> |
error = "Unknown server error"; |
619 |
> |
break; |
620 |
> |
case NO_DATA: |
621 |
> |
error = "No address associated with name"; |
622 |
> |
break; |
623 |
> |
default: |
624 |
> |
error = "Unknown error"; |
625 |
> |
break; |
626 |
> |
} |
627 |
> |
|
628 |
> |
cerr << prefix << ": " << error << "\n"; |
629 |
|
} |
630 |
|
else |
631 |
|
{ |