[doc/apt-get.8.xml]
[ntk/apt.git] / methods / http.cc
CommitLineData
be4401bf
AL
1// -*- mode: cpp; mode: fold -*-
2// Description /*{{{*/
2cbcabd8 3// $Id: http.cc,v 1.59 2004/05/08 19:42:35 mdz Exp $
be4401bf
AL
4/* ######################################################################
5
ae58a985 6 HTTP Acquire Method - This is the HTTP aquire method for APT.
be4401bf
AL
7
8 It uses HTTP/1.1 and many of the fancy options there-in, such as
e836f356
AL
9 pipelining, range, if-range and so on.
10
11 It is based on a doubly buffered select loop. A groupe of requests are
be4401bf
AL
12 fed into a single output buffer that is constantly fed out the
13 socket. This provides ideal pipelining as in many cases all of the
14 requests will fit into a single packet. The input socket is buffered
e836f356 15 the same way and fed into the fd for the file (may be a pipe in future).
be4401bf
AL
16
17 This double buffering provides fairly substantial transfer rates,
18 compared to wget the http method is about 4% faster. Most importantly,
19 when HTTP is compared with FTP as a protocol the speed difference is
20 huge. In tests over the internet from two sites to llug (via ATM) this
21 program got 230k/s sustained http transfer rates. FTP on the other
22 hand topped out at 170k/s. That combined with the time to setup the
23 FTP connection makes HTTP a vastly superior protocol.
24
25 ##################################################################### */
26 /*}}}*/
27// Include Files /*{{{*/
28#include <apt-pkg/fileutl.h>
29#include <apt-pkg/acquire-method.h>
30#include <apt-pkg/error.h>
63b1700f 31#include <apt-pkg/hashes.h>
be4401bf
AL
32
33#include <sys/stat.h>
34#include <sys/time.h>
35#include <utime.h>
36#include <unistd.h>
492f957a 37#include <signal.h>
be4401bf 38#include <stdio.h>
65a1e968 39#include <errno.h>
42195eb2
AL
40#include <string.h>
41#include <iostream>
15d7e515 42#include <map>
d77559ac 43#include <apti18n.h>
be4401bf
AL
44
45// Internet stuff
0837bd25 46#include <netdb.h>
be4401bf 47
59b46c41 48#include "config.h"
0837bd25 49#include "connect.h"
934b6582 50#include "rfc2553emu.h"
be4401bf 51#include "http.h"
934b6582 52
be4401bf 53 /*}}}*/
42195eb2 54using namespace std;
be4401bf 55
492f957a
AL
56string HttpMethod::FailFile;
57int HttpMethod::FailFd = -1;
58time_t HttpMethod::FailTime = 0;
c37030c2 59unsigned long PipelineDepth = 10;
3000ccea 60unsigned long TimeOut = 120;
15d7e515 61bool AllowRedirect = false;
c98b1307 62bool Debug = false;
c37030c2 63URI Proxy;
492f957a 64
7c6e2dc7
MV
65unsigned long CircleBuf::BwReadLimit=0;
66unsigned long CircleBuf::BwTickReadData=0;
67struct timeval CircleBuf::BwReadTick={0,0};
68const unsigned int CircleBuf::BW_HZ=10;
69
be4401bf
AL
70// CircleBuf::CircleBuf - Circular input buffer /*{{{*/
71// ---------------------------------------------------------------------
72/* */
63b1700f 73CircleBuf::CircleBuf(unsigned long Size) : Size(Size), Hash(0)
be4401bf
AL
74{
75 Buf = new unsigned char[Size];
76 Reset();
7c6e2dc7
MV
77
78 CircleBuf::BwReadLimit = _config->FindI("Acquire::http::Dl-Limit",0)*1024;
be4401bf
AL
79}
80 /*}}}*/
81// CircleBuf::Reset - Reset to the default state /*{{{*/
82// ---------------------------------------------------------------------
83/* */
84void CircleBuf::Reset()
85{
86 InP = 0;
87 OutP = 0;
88 StrPos = 0;
89 MaxGet = (unsigned int)-1;
90 OutQueue = string();
63b1700f 91 if (Hash != 0)
be4401bf 92 {
63b1700f
AL
93 delete Hash;
94 Hash = new Hashes;
be4401bf
AL
95 }
96};
97 /*}}}*/
98// CircleBuf::Read - Read from a FD into the circular buffer /*{{{*/
99// ---------------------------------------------------------------------
100/* This fills up the buffer with as much data as is in the FD, assuming it
101 is non-blocking.. */
102bool CircleBuf::Read(int Fd)
103{
7c6e2dc7
MV
104 unsigned long BwReadMax;
105
be4401bf
AL
106 while (1)
107 {
108 // Woops, buffer is full
109 if (InP - OutP == Size)
110 return true;
7c6e2dc7
MV
111
112 // what's left to read in this tick
113 BwReadMax = CircleBuf::BwReadLimit/BW_HZ;
114
115 if(CircleBuf::BwReadLimit) {
116 struct timeval now;
117 gettimeofday(&now,0);
118
119 unsigned long d = (now.tv_sec-CircleBuf::BwReadTick.tv_sec)*1000000 +
120 now.tv_usec-CircleBuf::BwReadTick.tv_usec;
121 if(d > 1000000/BW_HZ) {
122 CircleBuf::BwReadTick = now;
123 CircleBuf::BwTickReadData = 0;
124 }
125
126 if(CircleBuf::BwTickReadData >= BwReadMax) {
127 usleep(1000000/BW_HZ);
128 return true;
129 }
130 }
131
be4401bf
AL
132 // Write the buffer segment
133 int Res;
7c6e2dc7
MV
134 if(CircleBuf::BwReadLimit) {
135 Res = read(Fd,Buf + (InP%Size),
136 BwReadMax > LeftRead() ? LeftRead() : BwReadMax);
137 } else
138 Res = read(Fd,Buf + (InP%Size),LeftRead());
be4401bf 139
7c6e2dc7
MV
140 if(Res > 0 && BwReadLimit > 0)
141 CircleBuf::BwTickReadData += Res;
142
be4401bf
AL
143 if (Res == 0)
144 return false;
145 if (Res < 0)
146 {
147 if (errno == EAGAIN)
148 return true;
149 return false;
150 }
151
152 if (InP == 0)
153 gettimeofday(&Start,0);
154 InP += Res;
155 }
156}
157 /*}}}*/
158// CircleBuf::Read - Put the string into the buffer /*{{{*/
159// ---------------------------------------------------------------------
160/* This will hold the string in and fill the buffer with it as it empties */
161bool CircleBuf::Read(string Data)
162{
163 OutQueue += Data;
164 FillOut();
165 return true;
166}
167 /*}}}*/
168// CircleBuf::FillOut - Fill the buffer from the output queue /*{{{*/
169// ---------------------------------------------------------------------
170/* */
171void CircleBuf::FillOut()
172{
173 if (OutQueue.empty() == true)
174 return;
175 while (1)
176 {
177 // Woops, buffer is full
178 if (InP - OutP == Size)
179 return;
180
181 // Write the buffer segment
182 unsigned long Sz = LeftRead();
183 if (OutQueue.length() - StrPos < Sz)
184 Sz = OutQueue.length() - StrPos;
42195eb2 185 memcpy(Buf + (InP%Size),OutQueue.c_str() + StrPos,Sz);
be4401bf
AL
186
187 // Advance
188 StrPos += Sz;
189 InP += Sz;
190 if (OutQueue.length() == StrPos)
191 {
192 StrPos = 0;
193 OutQueue = "";
194 return;
195 }
196 }
197}
198 /*}}}*/
199// CircleBuf::Write - Write from the buffer into a FD /*{{{*/
200// ---------------------------------------------------------------------
201/* This empties the buffer into the FD. */
202bool CircleBuf::Write(int Fd)
203{
204 while (1)
205 {
206 FillOut();
207
208 // Woops, buffer is empty
209 if (OutP == InP)
210 return true;
211
212 if (OutP == MaxGet)
213 return true;
214
215 // Write the buffer segment
216 int Res;
217 Res = write(Fd,Buf + (OutP%Size),LeftWrite());
218
219 if (Res == 0)
220 return false;
221 if (Res < 0)
222 {
223 if (errno == EAGAIN)
224 return true;
225
226 return false;
227 }
228
63b1700f
AL
229 if (Hash != 0)
230 Hash->Add(Buf + (OutP%Size),Res);
be4401bf
AL
231
232 OutP += Res;
233 }
234}
235 /*}}}*/
236// CircleBuf::WriteTillEl - Write from the buffer to a string /*{{{*/
237// ---------------------------------------------------------------------
238/* This copies till the first empty line */
239bool CircleBuf::WriteTillEl(string &Data,bool Single)
240{
241 // We cheat and assume it is unneeded to have more than one buffer load
242 for (unsigned long I = OutP; I < InP; I++)
243 {
244 if (Buf[I%Size] != '\n')
245 continue;
2cbcabd8 246 ++I;
be4401bf
AL
247
248 if (Single == false)
249 {
2cbcabd8
AL
250 if (I < InP && Buf[I%Size] == '\r')
251 ++I;
927c393f
MV
252 if (I >= InP || Buf[I%Size] != '\n')
253 continue;
254 ++I;
be4401bf
AL
255 }
256
be4401bf
AL
257 Data = "";
258 while (OutP < I)
259 {
260 unsigned long Sz = LeftWrite();
261 if (Sz == 0)
262 return false;
927c393f 263 if (I - OutP < Sz)
be4401bf
AL
264 Sz = I - OutP;
265 Data += string((char *)(Buf + (OutP%Size)),Sz);
266 OutP += Sz;
267 }
268 return true;
269 }
270 return false;
271}
272 /*}}}*/
273// CircleBuf::Stats - Print out stats information /*{{{*/
274// ---------------------------------------------------------------------
275/* */
276void CircleBuf::Stats()
277{
278 if (InP == 0)
279 return;
280
281 struct timeval Stop;
282 gettimeofday(&Stop,0);
283/* float Diff = Stop.tv_sec - Start.tv_sec +
284 (float)(Stop.tv_usec - Start.tv_usec)/1000000;
285 clog << "Got " << InP << " in " << Diff << " at " << InP/Diff << endl;*/
286}
287 /*}}}*/
288
289// ServerState::ServerState - Constructor /*{{{*/
290// ---------------------------------------------------------------------
291/* */
292ServerState::ServerState(URI Srv,HttpMethod *Owner) : Owner(Owner),
3000ccea 293 In(64*1024), Out(4*1024),
be4401bf
AL
294 ServerName(Srv)
295{
296 Reset();
297}
298 /*}}}*/
299// ServerState::Open - Open a connection to the server /*{{{*/
300// ---------------------------------------------------------------------
301/* This opens a connection to the server. */
be4401bf
AL
302bool ServerState::Open()
303{
92e889c8
AL
304 // Use the already open connection if possible.
305 if (ServerFd != -1)
306 return true;
307
be4401bf 308 Close();
492f957a
AL
309 In.Reset();
310 Out.Reset();
e836f356
AL
311 Persistent = true;
312
492f957a 313 // Determine the proxy setting
52e7839a 314 if (getenv("http_proxy") == 0)
492f957a 315 {
352c2768
AL
316 string DefProxy = _config->Find("Acquire::http::Proxy");
317 string SpecificProxy = _config->Find("Acquire::http::Proxy::" + ServerName.Host);
318 if (SpecificProxy.empty() == false)
319 {
320 if (SpecificProxy == "DIRECT")
321 Proxy = "";
322 else
323 Proxy = SpecificProxy;
324 }
492f957a 325 else
352c2768
AL
326 Proxy = DefProxy;
327 }
492f957a 328 else
352c2768
AL
329 Proxy = getenv("http_proxy");
330
f8081133 331 // Parse no_proxy, a , separated list of domains
9e2a06ff
AL
332 if (getenv("no_proxy") != 0)
333 {
f8081133
AL
334 if (CheckDomainList(ServerName.Host,getenv("no_proxy")) == true)
335 Proxy = "";
336 }
337
492f957a 338 // Determine what host and port to use based on the proxy settings
934b6582 339 int Port = 0;
492f957a 340 string Host;
dd1fd92b 341 if (Proxy.empty() == true || Proxy.Host.empty() == true)
be4401bf 342 {
92e889c8
AL
343 if (ServerName.Port != 0)
344 Port = ServerName.Port;
be4401bf
AL
345 Host = ServerName.Host;
346 }
347 else
348 {
92e889c8
AL
349 if (Proxy.Port != 0)
350 Port = Proxy.Port;
be4401bf
AL
351 Host = Proxy.Host;
352 }
353
0837bd25 354 // Connect to the remote server
9505213b 355 if (Connect(Host,Port,"http",80,ServerFd,TimeOut,Owner) == false)
0837bd25 356 return false;
3000ccea 357
be4401bf
AL
358 return true;
359}
360 /*}}}*/
361// ServerState::Close - Close a connection to the server /*{{{*/
362// ---------------------------------------------------------------------
363/* */
364bool ServerState::Close()
365{
366 close(ServerFd);
367 ServerFd = -1;
be4401bf
AL
368 return true;
369}
370 /*}}}*/
371// ServerState::RunHeaders - Get the headers before the data /*{{{*/
372// ---------------------------------------------------------------------
38965a34
MV
373/* Returns 0 if things are OK, 1 if an IO error occurred and 2 if a header
374 parse error occurred */
92e889c8 375int ServerState::RunHeaders()
be4401bf
AL
376{
377 State = Header;
378
519c5591 379 Owner->Status(_("Waiting for headers"));
be4401bf
AL
380
381 Major = 0;
382 Minor = 0;
383 Result = 0;
384 Size = 0;
385 StartPos = 0;
92e889c8
AL
386 Encoding = Closes;
387 HaveContent = false;
be4401bf
AL
388 time(&Date);
389
390 do
391 {
392 string Data;
393 if (In.WriteTillEl(Data) == false)
394 continue;
9d95e726
AL
395
396 if (Debug == true)
397 clog << Data;
be4401bf
AL
398
399 for (string::const_iterator I = Data.begin(); I < Data.end(); I++)
400 {
401 string::const_iterator J = I;
402 for (; J != Data.end() && *J != '\n' && *J != '\r';J++);
42195eb2 403 if (HeaderLine(string(I,J)) == false)
92e889c8 404 return 2;
be4401bf
AL
405 I = J;
406 }
e836f356 407
b2e465d6
AL
408 // 100 Continue is a Nop...
409 if (Result == 100)
410 continue;
411
e836f356
AL
412 // Tidy up the connection persistance state.
413 if (Encoding == Closes && HaveContent == true)
414 Persistent = false;
415
92e889c8 416 return 0;
be4401bf
AL
417 }
418 while (Owner->Go(false,this) == true);
e836f356 419
92e889c8 420 return 1;
be4401bf
AL
421}
422 /*}}}*/
423// ServerState::RunData - Transfer the data from the socket /*{{{*/
424// ---------------------------------------------------------------------
425/* */
426bool ServerState::RunData()
427{
428 State = Data;
429
430 // Chunked transfer encoding is fun..
431 if (Encoding == Chunked)
432 {
433 while (1)
434 {
435 // Grab the block size
436 bool Last = true;
437 string Data;
438 In.Limit(-1);
439 do
440 {
441 if (In.WriteTillEl(Data,true) == true)
442 break;
443 }
444 while ((Last = Owner->Go(false,this)) == true);
445
446 if (Last == false)
447 return false;
448
449 // See if we are done
450 unsigned long Len = strtol(Data.c_str(),0,16);
451 if (Len == 0)
452 {
453 In.Limit(-1);
454
455 // We have to remove the entity trailer
456 Last = true;
457 do
458 {
459 if (In.WriteTillEl(Data,true) == true && Data.length() <= 2)
460 break;
461 }
462 while ((Last = Owner->Go(false,this)) == true);
463 if (Last == false)
464 return false;
e1b96638 465 return !_error->PendingError();
be4401bf
AL
466 }
467
468 // Transfer the block
469 In.Limit(Len);
470 while (Owner->Go(true,this) == true)
471 if (In.IsLimit() == true)
472 break;
473
474 // Error
475 if (In.IsLimit() == false)
476 return false;
477
478 // The server sends an extra new line before the next block specifier..
479 In.Limit(-1);
480 Last = true;
481 do
482 {
483 if (In.WriteTillEl(Data,true) == true)
484 break;
485 }
486 while ((Last = Owner->Go(false,this)) == true);
487 if (Last == false)
488 return false;
92e889c8 489 }
be4401bf
AL
490 }
491 else
492 {
493 /* Closes encoding is used when the server did not specify a size, the
494 loss of the connection means we are done */
495 if (Encoding == Closes)
496 In.Limit(-1);
497 else
498 In.Limit(Size - StartPos);
499
500 // Just transfer the whole block.
501 do
502 {
503 if (In.IsLimit() == false)
504 continue;
505
506 In.Limit(-1);
e1b96638 507 return !_error->PendingError();
be4401bf
AL
508 }
509 while (Owner->Go(true,this) == true);
510 }
511
e1b96638 512 return Owner->Flush(this) && !_error->PendingError();
be4401bf
AL
513}
514 /*}}}*/
515// ServerState::HeaderLine - Process a header line /*{{{*/
516// ---------------------------------------------------------------------
517/* */
518bool ServerState::HeaderLine(string Line)
519{
520 if (Line.empty() == true)
521 return true;
30456e14 522
be4401bf
AL
523 // The http server might be trying to do something evil.
524 if (Line.length() >= MAXLEN)
dc738e7a 525 return _error->Error(_("Got a single header line over %u chars"),MAXLEN);
be4401bf
AL
526
527 string::size_type Pos = Line.find(' ');
528 if (Pos == string::npos || Pos+1 > Line.length())
c901051d
AL
529 {
530 // Blah, some servers use "connection:closes", evil.
531 Pos = Line.find(':');
532 if (Pos == string::npos || Pos + 2 > Line.length())
dc738e7a 533 return _error->Error(_("Bad header line"));
c901051d
AL
534 Pos++;
535 }
be4401bf 536
c901051d
AL
537 // Parse off any trailing spaces between the : and the next word.
538 string::size_type Pos2 = Pos;
539 while (Pos2 < Line.length() && isspace(Line[Pos2]) != 0)
540 Pos2++;
541
542 string Tag = string(Line,0,Pos);
543 string Val = string(Line,Pos2);
544
42195eb2 545 if (stringcasecmp(Tag.c_str(),Tag.c_str()+4,"HTTP") == 0)
be4401bf
AL
546 {
547 // Evil servers return no version
548 if (Line[4] == '/')
549 {
550 if (sscanf(Line.c_str(),"HTTP/%u.%u %u %[^\n]",&Major,&Minor,
551 &Result,Code) != 4)
db0db9fe 552 return _error->Error(_("The HTTP server sent an invalid reply header"));
be4401bf
AL
553 }
554 else
555 {
556 Major = 0;
557 Minor = 9;
558 if (sscanf(Line.c_str(),"HTTP %u %[^\n]",&Result,Code) != 2)
db0db9fe 559 return _error->Error(_("The HTTP server sent an invalid reply header"));
be4401bf 560 }
e836f356
AL
561
562 /* Check the HTTP response header to get the default persistance
563 state. */
564 if (Major < 1)
565 Persistent = false;
566 else
567 {
568 if (Major == 1 && Minor <= 0)
569 Persistent = false;
570 else
571 Persistent = true;
572 }
b2e465d6 573
be4401bf
AL
574 return true;
575 }
576
92e889c8 577 if (stringcasecmp(Tag,"Content-Length:") == 0)
be4401bf
AL
578 {
579 if (Encoding == Closes)
580 Encoding = Stream;
92e889c8 581 HaveContent = true;
be4401bf
AL
582
583 // The length is already set from the Content-Range header
584 if (StartPos != 0)
585 return true;
586
587 if (sscanf(Val.c_str(),"%lu",&Size) != 1)
db0db9fe 588 return _error->Error(_("The HTTP server sent an invalid Content-Length header"));
be4401bf
AL
589 return true;
590 }
591
92e889c8
AL
592 if (stringcasecmp(Tag,"Content-Type:") == 0)
593 {
594 HaveContent = true;
595 return true;
596 }
597
598 if (stringcasecmp(Tag,"Content-Range:") == 0)
be4401bf 599 {
92e889c8
AL
600 HaveContent = true;
601
be4401bf 602 if (sscanf(Val.c_str(),"bytes %lu-%*u/%lu",&StartPos,&Size) != 2)
db0db9fe 603 return _error->Error(_("The HTTP server sent an invalid Content-Range header"));
be4401bf 604 if ((unsigned)StartPos > Size)
db0db9fe 605 return _error->Error(_("This HTTP server has broken range support"));
be4401bf
AL
606 return true;
607 }
608
92e889c8 609 if (stringcasecmp(Tag,"Transfer-Encoding:") == 0)
be4401bf 610 {
92e889c8
AL
611 HaveContent = true;
612 if (stringcasecmp(Val,"chunked") == 0)
e836f356 613 Encoding = Chunked;
be4401bf
AL
614 return true;
615 }
616
e836f356
AL
617 if (stringcasecmp(Tag,"Connection:") == 0)
618 {
619 if (stringcasecmp(Val,"close") == 0)
620 Persistent = false;
621 if (stringcasecmp(Val,"keep-alive") == 0)
622 Persistent = true;
623 return true;
624 }
625
92e889c8 626 if (stringcasecmp(Tag,"Last-Modified:") == 0)
be4401bf
AL
627 {
628 if (StrToTime(Val,Date) == false)
dc738e7a 629 return _error->Error(_("Unknown date format"));
be4401bf
AL
630 return true;
631 }
632
15d7e515
MV
633 if (stringcasecmp(Tag,"Location:") == 0)
634 {
635 Location = Val;
636 return true;
637 }
638
be4401bf
AL
639 return true;
640}
641 /*}}}*/
642
643// HttpMethod::SendReq - Send the HTTP request /*{{{*/
644// ---------------------------------------------------------------------
645/* This places the http request in the outbound buffer */
646void HttpMethod::SendReq(FetchItem *Itm,CircleBuf &Out)
647{
648 URI Uri = Itm->Uri;
c1a22377 649
be4401bf 650 // The HTTP server expects a hostname with a trailing :port
c1a22377 651 char Buf[1000];
be4401bf
AL
652 string ProperHost = Uri.Host;
653 if (Uri.Port != 0)
654 {
655 sprintf(Buf,":%u",Uri.Port);
656 ProperHost += Buf;
657 }
658
c1a22377
AL
659 // Just in case.
660 if (Itm->Uri.length() >= sizeof(Buf))
661 abort();
662
492f957a
AL
663 /* Build the request. We include a keep-alive header only for non-proxy
664 requests. This is to tweak old http/1.0 servers that do support keep-alive
665 but not HTTP/1.1 automatic keep-alive. Doing this with a proxy server
666 will glitch HTTP/1.0 proxies because they do not filter it out and
667 pass it on, HTTP/1.1 says the connection should default to keep alive
668 and we expect the proxy to do this */
02b7ddb1 669 if (Proxy.empty() == true || Proxy.Host.empty())
be4401bf 670 sprintf(Buf,"GET %s HTTP/1.1\r\nHost: %s\r\nConnection: keep-alive\r\n",
a4edf53b 671 QuoteString(Uri.Path,"~").c_str(),ProperHost.c_str());
be4401bf 672 else
c1a22377
AL
673 {
674 /* Generate a cache control header if necessary. We place a max
675 cache age on index files, optionally set a no-cache directive
676 and a no-store directive for archives. */
be4401bf
AL
677 sprintf(Buf,"GET %s HTTP/1.1\r\nHost: %s\r\n",
678 Itm->Uri.c_str(),ProperHost.c_str());
106e6740
MV
679 // only generate a cache control header if we actually want to
680 // use a cache
681 if (_config->FindB("Acquire::http::No-Cache",false) == false)
c1a22377
AL
682 {
683 if (Itm->IndexFile == true)
684 sprintf(Buf+strlen(Buf),"Cache-Control: max-age=%u\r\n",
bcbe61ae 685 _config->FindI("Acquire::http::Max-Age",0));
c1a22377
AL
686 else
687 {
688 if (_config->FindB("Acquire::http::No-Store",false) == true)
689 strcat(Buf,"Cache-Control: no-store\r\n");
690 }
691 }
692 }
106e6740
MV
693 // generate a no-cache header if needed
694 if (_config->FindB("Acquire::http::No-Cache",false) == true)
695 strcat(Buf,"Cache-Control: no-cache\r\nPragma: no-cache\r\n");
696
c1a22377 697
be4401bf 698 string Req = Buf;
492f957a 699
be4401bf
AL
700 // Check for a partial file
701 struct stat SBuf;
702 if (stat(Itm->DestFile.c_str(),&SBuf) >= 0 && SBuf.st_size > 0)
703 {
704 // In this case we send an if-range query with a range header
1ae93c94 705 sprintf(Buf,"Range: bytes=%li-\r\nIf-Range: %s\r\n",(long)SBuf.st_size - 1,
be4401bf
AL
706 TimeRFC1123(SBuf.st_mtime).c_str());
707 Req += Buf;
708 }
709 else
710 {
711 if (Itm->LastModified != 0)
712 {
713 sprintf(Buf,"If-Modified-Since: %s\r\n",TimeRFC1123(Itm->LastModified).c_str());
714 Req += Buf;
715 }
716 }
717
8d64c395
AL
718 if (Proxy.User.empty() == false || Proxy.Password.empty() == false)
719 Req += string("Proxy-Authorization: Basic ") +
720 Base64Encode(Proxy.User + ":" + Proxy.Password) + "\r\n";
be4401bf 721
b2e465d6
AL
722 if (Uri.User.empty() == false || Uri.Password.empty() == false)
723 Req += string("Authorization: Basic ") +
724 Base64Encode(Uri.User + ":" + Uri.Password) + "\r\n";
725
59b46c41 726 Req += "User-Agent: Debian APT-HTTP/1.3 ("VERSION")\r\n\r\n";
c98b1307
AL
727
728 if (Debug == true)
729 cerr << Req << endl;
c1a22377 730
be4401bf
AL
731 Out.Read(Req);
732}
733 /*}}}*/
734// HttpMethod::Go - Run a single loop /*{{{*/
735// ---------------------------------------------------------------------
736/* This runs the select loop over the server FDs, Output file FDs and
737 stdin. */
738bool HttpMethod::Go(bool ToFile,ServerState *Srv)
739{
740 // Server has closed the connection
8195ae46
AL
741 if (Srv->ServerFd == -1 && (Srv->In.WriteSpace() == false ||
742 ToFile == false))
be4401bf
AL
743 return false;
744
d955fe80 745 fd_set rfds,wfds;
be4401bf
AL
746 FD_ZERO(&rfds);
747 FD_ZERO(&wfds);
be4401bf 748
e836f356
AL
749 /* Add the server. We only send more requests if the connection will
750 be persisting */
751 if (Srv->Out.WriteSpace() == true && Srv->ServerFd != -1
752 && Srv->Persistent == true)
be4401bf 753 FD_SET(Srv->ServerFd,&wfds);
e836f356 754 if (Srv->In.ReadSpace() == true && Srv->ServerFd != -1)
be4401bf
AL
755 FD_SET(Srv->ServerFd,&rfds);
756
757 // Add the file
758 int FileFD = -1;
759 if (File != 0)
760 FileFD = File->Fd();
761
762 if (Srv->In.WriteSpace() == true && ToFile == true && FileFD != -1)
763 FD_SET(FileFD,&wfds);
764
765 // Add stdin
766 FD_SET(STDIN_FILENO,&rfds);
767
be4401bf
AL
768 // Figure out the max fd
769 int MaxFd = FileFD;
770 if (MaxFd < Srv->ServerFd)
771 MaxFd = Srv->ServerFd;
8195ae46 772
be4401bf
AL
773 // Select
774 struct timeval tv;
3000ccea 775 tv.tv_sec = TimeOut;
be4401bf
AL
776 tv.tv_usec = 0;
777 int Res = 0;
d955fe80 778 if ((Res = select(MaxFd+1,&rfds,&wfds,0,&tv)) < 0)
c37b9502
AL
779 {
780 if (errno == EINTR)
781 return true;
dc738e7a 782 return _error->Errno("select",_("Select failed"));
c37b9502 783 }
be4401bf
AL
784
785 if (Res == 0)
786 {
dc738e7a 787 _error->Error(_("Connection timed out"));
be4401bf
AL
788 return ServerDie(Srv);
789 }
790
be4401bf
AL
791 // Handle server IO
792 if (Srv->ServerFd != -1 && FD_ISSET(Srv->ServerFd,&rfds))
793 {
794 errno = 0;
795 if (Srv->In.Read(Srv->ServerFd) == false)
796 return ServerDie(Srv);
797 }
798
799 if (Srv->ServerFd != -1 && FD_ISSET(Srv->ServerFd,&wfds))
800 {
801 errno = 0;
802 if (Srv->Out.Write(Srv->ServerFd) == false)
803 return ServerDie(Srv);
804 }
805
806 // Send data to the file
807 if (FileFD != -1 && FD_ISSET(FileFD,&wfds))
808 {
809 if (Srv->In.Write(FileFD) == false)
dc738e7a 810 return _error->Errno("write",_("Error writing to output file"));
be4401bf
AL
811 }
812
813 // Handle commands from APT
814 if (FD_ISSET(STDIN_FILENO,&rfds))
815 {
6920216d 816 if (Run(true) != -1)
be4401bf
AL
817 exit(100);
818 }
819
820 return true;
821}
822 /*}}}*/
823// HttpMethod::Flush - Dump the buffer into the file /*{{{*/
824// ---------------------------------------------------------------------
825/* This takes the current input buffer from the Server FD and writes it
826 into the file */
827bool HttpMethod::Flush(ServerState *Srv)
828{
829 if (File != 0)
830 {
b57c8bb4
MV
831 // on GNU/kFreeBSD, apt dies on /dev/null because non-blocking
832 // can't be set
833 if (File->Name() != "/dev/null")
834 SetNonBlock(File->Fd(),false);
be4401bf
AL
835 if (Srv->In.WriteSpace() == false)
836 return true;
837
838 while (Srv->In.WriteSpace() == true)
839 {
840 if (Srv->In.Write(File->Fd()) == false)
dc738e7a 841 return _error->Errno("write",_("Error writing to file"));
92e889c8
AL
842 if (Srv->In.IsLimit() == true)
843 return true;
be4401bf
AL
844 }
845
846 if (Srv->In.IsLimit() == true || Srv->Encoding == ServerState::Closes)
847 return true;
848 }
849 return false;
850}
851 /*}}}*/
852// HttpMethod::ServerDie - The server has closed the connection. /*{{{*/
853// ---------------------------------------------------------------------
854/* */
855bool HttpMethod::ServerDie(ServerState *Srv)
856{
2b154e53
AL
857 unsigned int LErrno = errno;
858
be4401bf
AL
859 // Dump the buffer to the file
860 if (Srv->State == ServerState::Data)
861 {
b57c8bb4
MV
862 // on GNU/kFreeBSD, apt dies on /dev/null because non-blocking
863 // can't be set
864 if (File->Name() != "/dev/null")
865 SetNonBlock(File->Fd(),false);
be4401bf
AL
866 while (Srv->In.WriteSpace() == true)
867 {
868 if (Srv->In.Write(File->Fd()) == false)
dc738e7a 869 return _error->Errno("write",_("Error writing to the file"));
92e889c8
AL
870
871 // Done
872 if (Srv->In.IsLimit() == true)
873 return true;
be4401bf
AL
874 }
875 }
876
877 // See if this is because the server finished the data stream
878 if (Srv->In.IsLimit() == false && Srv->State != ServerState::Header &&
879 Srv->Encoding != ServerState::Closes)
880 {
3d615484 881 Srv->Close();
2b154e53 882 if (LErrno == 0)
db0db9fe 883 return _error->Error(_("Error reading from server. Remote end closed connection"));
2b154e53 884 errno = LErrno;
dc738e7a 885 return _error->Errno("read",_("Error reading from server"));
be4401bf
AL
886 }
887 else
888 {
889 Srv->In.Limit(-1);
890
891 // Nothing left in the buffer
892 if (Srv->In.WriteSpace() == false)
893 return false;
894
895 // We may have got multiple responses back in one packet..
896 Srv->Close();
897 return true;
898 }
899
900 return false;
901}
902 /*}}}*/
903// HttpMethod::DealWithHeaders - Handle the retrieved header data /*{{{*/
904// ---------------------------------------------------------------------
905/* We look at the header data we got back from the server and decide what
906 to do. Returns
907 0 - File is open,
908 1 - IMS hit
92e889c8 909 3 - Unrecoverable error
94235cfb 910 4 - Error with error content page
15d7e515
MV
911 5 - Unrecoverable non-server error (close the connection)
912 6 - Try again with a new or changed URI
913 */
be4401bf
AL
914int HttpMethod::DealWithHeaders(FetchResult &Res,ServerState *Srv)
915{
916 // Not Modified
917 if (Srv->Result == 304)
918 {
919 unlink(Queue->DestFile.c_str());
920 Res.IMSHit = true;
921 Res.LastModified = Queue->LastModified;
922 return 1;
923 }
924
15d7e515
MV
925 /* Redirect
926 *
927 * Note that it is only OK for us to treat all redirection the same
928 * because we *always* use GET, not other HTTP methods. There are
929 * three redirection codes for which it is not appropriate that we
930 * redirect. Pass on those codes so the error handling kicks in.
931 */
932 if (AllowRedirect
933 && (Srv->Result > 300 && Srv->Result < 400)
934 && (Srv->Result != 300 // Multiple Choices
935 && Srv->Result != 304 // Not Modified
936 && Srv->Result != 306)) // (Not part of HTTP/1.1, reserved)
937 {
938 if (!Srv->Location.empty())
939 {
940 NextURI = Srv->Location;
941 return 6;
942 }
943 /* else pass through for error message */
944 }
945
be4401bf
AL
946 /* We have a reply we dont handle. This should indicate a perm server
947 failure */
948 if (Srv->Result < 200 || Srv->Result >= 300)
949 {
950 _error->Error("%u %s",Srv->Result,Srv->Code);
92e889c8
AL
951 if (Srv->HaveContent == true)
952 return 4;
be4401bf
AL
953 return 3;
954 }
955
956 // This is some sort of 2xx 'data follows' reply
957 Res.LastModified = Srv->Date;
958 Res.Size = Srv->Size;
959
960 // Open the file
961 delete File;
962 File = new FileFd(Queue->DestFile,FileFd::WriteAny);
963 if (_error->PendingError() == true)
94235cfb 964 return 5;
492f957a
AL
965
966 FailFile = Queue->DestFile;
30b30ec1 967 FailFile.c_str(); // Make sure we dont do a malloc in the signal handler
492f957a
AL
968 FailFd = File->Fd();
969 FailTime = Srv->Date;
970
be4401bf
AL
971 // Set the expected size
972 if (Srv->StartPos >= 0)
973 {
974 Res.ResumePoint = Srv->StartPos;
9b5d79ec
MV
975 if (ftruncate(File->Fd(),Srv->StartPos) < 0)
976 _error->Errno("ftruncate", _("Failed to truncate file"));
be4401bf
AL
977 }
978
979 // Set the start point
980 lseek(File->Fd(),0,SEEK_END);
981
63b1700f
AL
982 delete Srv->In.Hash;
983 Srv->In.Hash = new Hashes;
be4401bf 984
63b1700f 985 // Fill the Hash if the file is non-empty (resume)
be4401bf
AL
986 if (Srv->StartPos > 0)
987 {
988 lseek(File->Fd(),0,SEEK_SET);
63b1700f 989 if (Srv->In.Hash->AddFD(File->Fd(),Srv->StartPos) == false)
be4401bf 990 {
dc738e7a 991 _error->Errno("read",_("Problem hashing file"));
94235cfb 992 return 5;
be4401bf
AL
993 }
994 lseek(File->Fd(),0,SEEK_END);
995 }
996
997 SetNonBlock(File->Fd(),true);
998 return 0;
999}
1000 /*}}}*/
492f957a
AL
1001// HttpMethod::SigTerm - Handle a fatal signal /*{{{*/
1002// ---------------------------------------------------------------------
1003/* This closes and timestamps the open file. This is neccessary to get
1004 resume behavoir on user abort */
1005void HttpMethod::SigTerm(int)
1006{
1007 if (FailFd == -1)
ffe9323a 1008 _exit(100);
492f957a
AL
1009 close(FailFd);
1010
1011 // Timestamp
1012 struct utimbuf UBuf;
492f957a
AL
1013 UBuf.actime = FailTime;
1014 UBuf.modtime = FailTime;
1015 utime(FailFile.c_str(),&UBuf);
1016
ffe9323a 1017 _exit(100);
492f957a
AL
1018}
1019 /*}}}*/
5cb5d8dc
AL
1020// HttpMethod::Fetch - Fetch an item /*{{{*/
1021// ---------------------------------------------------------------------
1022/* This adds an item to the pipeline. We keep the pipeline at a fixed
1023 depth. */
1024bool HttpMethod::Fetch(FetchItem *)
1025{
1026 if (Server == 0)
1027 return true;
3000ccea 1028
5cb5d8dc
AL
1029 // Queue the requests
1030 int Depth = -1;
f93d1355
AL
1031 for (FetchItem *I = Queue; I != 0 && Depth < (signed)PipelineDepth;
1032 I = I->Next, Depth++)
5cb5d8dc 1033 {
f93d1355
AL
1034 // If pipelining is disabled, we only queue 1 request
1035 if (Server->Pipeline == false && Depth >= 0)
1036 break;
1037
5cb5d8dc
AL
1038 // Make sure we stick with the same server
1039 if (Server->Comp(I->Uri) == false)
1040 break;
5cb5d8dc 1041 if (QueueBack == I)
5cb5d8dc 1042 {
5cb5d8dc
AL
1043 QueueBack = I->Next;
1044 SendReq(I,Server->Out);
1045 continue;
f93d1355 1046 }
5cb5d8dc
AL
1047 }
1048
1049 return true;
1050};
1051 /*}}}*/
85f72a56
AL
1052// HttpMethod::Configuration - Handle a configuration message /*{{{*/
1053// ---------------------------------------------------------------------
1054/* We stash the desired pipeline depth */
1055bool HttpMethod::Configuration(string Message)
1056{
1057 if (pkgAcqMethod::Configuration(Message) == false)
1058 return false;
1059
15d7e515 1060 AllowRedirect = _config->FindB("Acquire::http::AllowRedirect",true);
30456e14
AL
1061 TimeOut = _config->FindI("Acquire::http::Timeout",TimeOut);
1062 PipelineDepth = _config->FindI("Acquire::http::Pipeline-Depth",
1063 PipelineDepth);
c98b1307 1064 Debug = _config->FindB("Debug::Acquire::http",false);
3000ccea 1065
85f72a56
AL
1066 return true;
1067}
1068 /*}}}*/
492f957a 1069// HttpMethod::Loop - Main loop /*{{{*/
be4401bf
AL
1070// ---------------------------------------------------------------------
1071/* */
1072int HttpMethod::Loop()
1073{
15d7e515
MV
1074 typedef vector<string> StringVector;
1075 typedef vector<string>::iterator StringVectorIterator;
1076 map<string, StringVector> Redirected;
1077
492f957a
AL
1078 signal(SIGTERM,SigTerm);
1079 signal(SIGINT,SigTerm);
1080
5cb5d8dc 1081 Server = 0;
be4401bf 1082
92e889c8 1083 int FailCounter = 0;
be4401bf 1084 while (1)
2b154e53 1085 {
be4401bf
AL
1086 // We have no commands, wait for some to arrive
1087 if (Queue == 0)
1088 {
1089 if (WaitFd(STDIN_FILENO) == false)
1090 return 0;
1091 }
1092
6920216d
AL
1093 /* Run messages, we can accept 0 (no message) if we didn't
1094 do a WaitFd above.. Otherwise the FD is closed. */
1095 int Result = Run(true);
1096 if (Result != -1 && (Result != 0 || Queue == 0))
be4401bf
AL
1097 return 100;
1098
1099 if (Queue == 0)
1100 continue;
1101
1102 // Connect to the server
1103 if (Server == 0 || Server->Comp(Queue->Uri) == false)
1104 {
1105 delete Server;
1106 Server = new ServerState(Queue->Uri,this);
1107 }
e836f356
AL
1108 /* If the server has explicitly said this is the last connection
1109 then we pre-emptively shut down the pipeline and tear down
1110 the connection. This will speed up HTTP/1.0 servers a tad
1111 since we don't have to wait for the close sequence to
1112 complete */
1113 if (Server->Persistent == false)
1114 Server->Close();
1115
a7fb252c
AL
1116 // Reset the pipeline
1117 if (Server->ServerFd == -1)
1118 QueueBack = Queue;
1119
be4401bf
AL
1120 // Connnect to the host
1121 if (Server->Open() == false)
1122 {
43252d15 1123 Fail(true);
a1459f52
AL
1124 delete Server;
1125 Server = 0;
be4401bf
AL
1126 continue;
1127 }
be4401bf 1128
5cb5d8dc
AL
1129 // Fill the pipeline.
1130 Fetch(0);
1131
92e889c8
AL
1132 // Fetch the next URL header data from the server.
1133 switch (Server->RunHeaders())
be4401bf 1134 {
92e889c8
AL
1135 case 0:
1136 break;
1137
1138 // The header data is bad
1139 case 2:
1140 {
db0db9fe 1141 _error->Error(_("Bad header data"));
43252d15 1142 Fail(true);
b2e465d6 1143 RotateDNS();
92e889c8
AL
1144 continue;
1145 }
1146
1147 // The server closed a connection during the header get..
1148 default:
1149 case 1:
1150 {
1151 FailCounter++;
3d615484 1152 _error->Discard();
92e889c8 1153 Server->Close();
f93d1355
AL
1154 Server->Pipeline = false;
1155
2b154e53
AL
1156 if (FailCounter >= 2)
1157 {
dc738e7a 1158 Fail(_("Connection failed"),true);
2b154e53
AL
1159 FailCounter = 0;
1160 }
1161
b2e465d6 1162 RotateDNS();
92e889c8
AL
1163 continue;
1164 }
1165 };
5cb5d8dc 1166
be4401bf
AL
1167 // Decide what to do.
1168 FetchResult Res;
bfd22fc0 1169 Res.Filename = Queue->DestFile;
be4401bf
AL
1170 switch (DealWithHeaders(Res,Server))
1171 {
1172 // Ok, the file is Open
1173 case 0:
1174 {
1175 URIStart(Res);
1176
1177 // Run the data
492f957a
AL
1178 bool Result = Server->RunData();
1179
b2e465d6
AL
1180 /* If the server is sending back sizeless responses then fill in
1181 the size now */
1182 if (Res.Size == 0)
1183 Res.Size = File->Size();
1184
492f957a
AL
1185 // Close the file, destroy the FD object and timestamp it
1186 FailFd = -1;
1187 delete File;
1188 File = 0;
1189
1190 // Timestamp
1191 struct utimbuf UBuf;
1192 time(&UBuf.actime);
1193 UBuf.actime = Server->Date;
1194 UBuf.modtime = Server->Date;
1195 utime(Queue->DestFile.c_str(),&UBuf);
1196
1197 // Send status to APT
1198 if (Result == true)
92e889c8 1199 {
a7c835af 1200 Res.TakeHashes(*Server->In.Hash);
92e889c8
AL
1201 URIDone(Res);
1202 }
492f957a 1203 else
82d0afc2
MV
1204 {
1205 if (Server->ServerFd == -1)
1206 {
1207 FailCounter++;
1208 _error->Discard();
1209 Server->Close();
1210
1211 if (FailCounter >= 2)
9a52beaa 1212 {
82d0afc2
MV
1213 Fail(_("Connection failed"),true);
1214 FailCounter = 0;
9a52beaa 1215 }
82d0afc2
MV
1216
1217 QueueBack = Queue;
1218 }
1219 else
1220 Fail(true);
1221 }
be4401bf
AL
1222 break;
1223 }
1224
1225 // IMS hit
1226 case 1:
1227 {
1228 URIDone(Res);
1229 break;
1230 }
1231
1232 // Hard server error, not found or something
1233 case 3:
1234 {
1235 Fail();
1236 break;
1237 }
94235cfb
AL
1238
1239 // Hard internal error, kill the connection and fail
1240 case 5:
1241 {
a305f593
AL
1242 delete File;
1243 File = 0;
1244
94235cfb 1245 Fail();
b2e465d6 1246 RotateDNS();
94235cfb
AL
1247 Server->Close();
1248 break;
1249 }
92e889c8
AL
1250
1251 // We need to flush the data, the header is like a 404 w/ error text
1252 case 4:
1253 {
1254 Fail();
1255
1256 // Send to content to dev/null
1257 File = new FileFd("/dev/null",FileFd::WriteExists);
1258 Server->RunData();
1259 delete File;
1260 File = 0;
1261 break;
1262 }
be4401bf 1263
15d7e515
MV
1264 // Try again with a new URL
1265 case 6:
1266 {
1267 // Clear rest of response if there is content
1268 if (Server->HaveContent)
1269 {
1270 File = new FileFd("/dev/null",FileFd::WriteExists);
1271 Server->RunData();
1272 delete File;
1273 File = 0;
1274 }
1275
1276 /* Detect redirect loops. No more redirects are allowed
1277 after the same URI is seen twice in a queue item. */
1278 StringVector &R = Redirected[Queue->DestFile];
1279 bool StopRedirects = false;
1280 if (R.size() == 0)
1281 R.push_back(Queue->Uri);
1282 else if (R[0] == "STOP" || R.size() > 10)
1283 StopRedirects = true;
1284 else
1285 {
1286 for (StringVectorIterator I = R.begin(); I != R.end(); I++)
1287 if (Queue->Uri == *I)
1288 {
1289 R[0] = "STOP";
1290 break;
1291 }
1292
1293 R.push_back(Queue->Uri);
1294 }
1295
1296 if (StopRedirects == false)
1297 Redirect(NextURI);
1298 else
1299 Fail();
1300
1301 break;
1302 }
1303
be4401bf 1304 default:
dc738e7a 1305 Fail(_("Internal error"));
be4401bf 1306 break;
92e889c8
AL
1307 }
1308
1309 FailCounter = 0;
be4401bf
AL
1310 }
1311
1312 return 0;
1313}
1314 /*}}}*/
1315
1316int main()
1317{
049c0171 1318 setlocale(LC_ALL, "");
ab7f4d7c
MV
1319 // ignore SIGPIPE, this can happen on write() if the socket
1320 // closes the connection (this is dealt with via ServerDie())
1321 signal(SIGPIPE, SIG_IGN);
049c0171 1322
be4401bf 1323 HttpMethod Mth;
be4401bf
AL
1324 return Mth.Loop();
1325}
a305f593
AL
1326
1327