* merged with debian-sid branch
[ntk/apt.git] / methods / http.cc
CommitLineData
be4401bf
AL
1// -*- mode: cpp; mode: fold -*-
2// Description /*{{{*/
2cbcabd8 3// $Id: http.cc,v 1.59 2004/05/08 19:42:35 mdz Exp $
be4401bf
AL
4/* ######################################################################
5
6 HTTP Acquire Method - This is the HTTP acquire method for APT.
7
8 It uses HTTP/1.1 and many of the fancy options there-in, such as
e836f356
AL
9 pipelining, range, if-range and so on.
10
11 It is based on a doubly buffered select loop. A group of requests are
be4401bf
AL
12 fed into a single output buffer that is constantly fed out the
13 socket. This provides ideal pipelining as in many cases all of the
14 requests will fit into a single packet. The input socket is buffered
e836f356 15 the same way and fed into the fd for the file (may be a pipe in future).
be4401bf
AL
16
17 This double buffering provides fairly substantial transfer rates,
18 compared to wget the http method is about 4% faster. Most importantly,
19 when HTTP is compared with FTP as a protocol the speed difference is
20 huge. In tests over the internet from two sites to llug (via ATM) this
21 program got 230k/s sustained http transfer rates. FTP on the other
22 hand topped out at 170k/s. That combined with the time to setup the
23 FTP connection makes HTTP a vastly superior protocol.
24
25 ##################################################################### */
26 /*}}}*/
27// Include Files /*{{{*/
28#include <apt-pkg/fileutl.h>
29#include <apt-pkg/acquire-method.h>
30#include <apt-pkg/error.h>
63b1700f 31#include <apt-pkg/hashes.h>
be4401bf
AL
32
33#include <sys/stat.h>
34#include <sys/time.h>
35#include <utime.h>
36#include <unistd.h>
492f957a 37#include <signal.h>
be4401bf 38#include <stdio.h>
65a1e968 39#include <errno.h>
42195eb2
AL
40#include <string.h>
41#include <iostream>
d77559ac 42#include <apti18n.h>
be4401bf
AL
43
44// Internet stuff
0837bd25 45#include <netdb.h>
be4401bf 46
0837bd25 47#include "connect.h"
934b6582 48#include "rfc2553emu.h"
be4401bf 49#include "http.h"
934b6582 50
be4401bf 51 /*}}}*/
42195eb2 52using namespace std;
be4401bf 53
492f957a
AL
54string HttpMethod::FailFile;
55int HttpMethod::FailFd = -1;
56time_t HttpMethod::FailTime = 0;
3000ccea
AL
57unsigned long PipelineDepth = 10;
58unsigned long TimeOut = 120;
c98b1307 59bool Debug = false;
492f957a 60
7c6e2dc7
MV
61unsigned long CircleBuf::BwReadLimit=0;
62unsigned long CircleBuf::BwTickReadData=0;
63struct timeval CircleBuf::BwReadTick={0,0};
64const unsigned int CircleBuf::BW_HZ=10;
65
be4401bf
AL
66// CircleBuf::CircleBuf - Circular input buffer /*{{{*/
67// ---------------------------------------------------------------------
68/* */
63b1700f 69CircleBuf::CircleBuf(unsigned long Size) : Size(Size), Hash(0)
be4401bf
AL
70{
71 Buf = new unsigned char[Size];
72 Reset();
7c6e2dc7
MV
73
74 CircleBuf::BwReadLimit = _config->FindI("Acquire::http::Dl-Limit",0)*1024;
be4401bf
AL
75}
76 /*}}}*/
77// CircleBuf::Reset - Reset to the default state /*{{{*/
78// ---------------------------------------------------------------------
79/* */
80void CircleBuf::Reset()
81{
82 InP = 0;
83 OutP = 0;
84 StrPos = 0;
85 MaxGet = (unsigned int)-1;
86 OutQueue = string();
63b1700f 87 if (Hash != 0)
be4401bf 88 {
63b1700f
AL
89 delete Hash;
90 Hash = new Hashes;
be4401bf
AL
91 }
92};
93 /*}}}*/
94// CircleBuf::Read - Read from a FD into the circular buffer /*{{{*/
95// ---------------------------------------------------------------------
96/* This fills up the buffer with as much data as is in the FD, assuming it
97 is non-blocking.. */
98bool CircleBuf::Read(int Fd)
99{
7c6e2dc7
MV
100 unsigned long BwReadMax;
101
be4401bf
AL
102 while (1)
103 {
104 // Woops, buffer is full
105 if (InP - OutP == Size)
106 return true;
2c386259 107
7c6e2dc7
MV
108 // what's left to read in this tick
109 BwReadMax = CircleBuf::BwReadLimit/BW_HZ;
110
111 if(CircleBuf::BwReadLimit) {
112 struct timeval now;
113 gettimeofday(&now,0);
114
115 unsigned long d = (now.tv_sec-CircleBuf::BwReadTick.tv_sec)*1000000 +
116 now.tv_usec-CircleBuf::BwReadTick.tv_usec;
117 if(d > 1000000/BW_HZ) {
118 CircleBuf::BwReadTick = now;
119 CircleBuf::BwTickReadData = 0;
120 }
121
122 if(CircleBuf::BwTickReadData >= BwReadMax) {
123 usleep(1000000/BW_HZ);
124 return true;
125 }
126 }
127
be4401bf
AL
128 // Write the buffer segment
129 int Res;
7c6e2dc7
MV
130 if(CircleBuf::BwReadLimit) {
131 Res = read(Fd,Buf + (InP%Size),
132 BwReadMax > LeftRead() ? LeftRead() : BwReadMax);
133 } else
134 Res = read(Fd,Buf + (InP%Size),LeftRead());
be4401bf 135
7c6e2dc7
MV
136 if(Res > 0 && BwReadLimit > 0)
137 CircleBuf::BwTickReadData += Res;
138
be4401bf
AL
139 if (Res == 0)
140 return false;
141 if (Res < 0)
142 {
143 if (errno == EAGAIN)
144 return true;
145 return false;
146 }
147
148 if (InP == 0)
149 gettimeofday(&Start,0);
150 InP += Res;
151 }
152}
153 /*}}}*/
154// CircleBuf::Read - Put the string into the buffer /*{{{*/
155// ---------------------------------------------------------------------
156/* This will hold the string in and fill the buffer with it as it empties */
157bool CircleBuf::Read(string Data)
158{
159 OutQueue += Data;
160 FillOut();
161 return true;
162}
163 /*}}}*/
164// CircleBuf::FillOut - Fill the buffer from the output queue /*{{{*/
165// ---------------------------------------------------------------------
166/* */
167void CircleBuf::FillOut()
168{
169 if (OutQueue.empty() == true)
170 return;
171 while (1)
172 {
173 // Woops, buffer is full
174 if (InP - OutP == Size)
175 return;
176
177 // Write the buffer segment
178 unsigned long Sz = LeftRead();
179 if (OutQueue.length() - StrPos < Sz)
180 Sz = OutQueue.length() - StrPos;
42195eb2 181 memcpy(Buf + (InP%Size),OutQueue.c_str() + StrPos,Sz);
be4401bf
AL
182
183 // Advance
184 StrPos += Sz;
185 InP += Sz;
186 if (OutQueue.length() == StrPos)
187 {
188 StrPos = 0;
189 OutQueue = "";
190 return;
191 }
192 }
193}
194 /*}}}*/
195// CircleBuf::Write - Write from the buffer into a FD /*{{{*/
196// ---------------------------------------------------------------------
197/* This empties the buffer into the FD. */
198bool CircleBuf::Write(int Fd)
199{
200 while (1)
201 {
202 FillOut();
203
204 // Woops, buffer is empty
205 if (OutP == InP)
206 return true;
207
208 if (OutP == MaxGet)
209 return true;
210
211 // Write the buffer segment
212 int Res;
213 Res = write(Fd,Buf + (OutP%Size),LeftWrite());
214
215 if (Res == 0)
216 return false;
217 if (Res < 0)
218 {
219 if (errno == EAGAIN)
220 return true;
221
222 return false;
223 }
224
63b1700f
AL
225 if (Hash != 0)
226 Hash->Add(Buf + (OutP%Size),Res);
be4401bf
AL
227
228 OutP += Res;
229 }
230}
231 /*}}}*/
232// CircleBuf::WriteTillEl - Write from the buffer to a string /*{{{*/
233// ---------------------------------------------------------------------
234/* This copies till the first empty line */
235bool CircleBuf::WriteTillEl(string &Data,bool Single)
236{
237 // We cheat and assume it is unneeded to have more than one buffer load
238 for (unsigned long I = OutP; I < InP; I++)
239 {
240 if (Buf[I%Size] != '\n')
241 continue;
2cbcabd8 242 ++I;
be4401bf
AL
243
244 if (Single == false)
245 {
2cbcabd8
AL
246 if (I < InP && Buf[I%Size] == '\r')
247 ++I;
927c393f
MV
248 if (I >= InP || Buf[I%Size] != '\n')
249 continue;
250 ++I;
be4401bf
AL
251 }
252
be4401bf
AL
253 Data = "";
254 while (OutP < I)
255 {
256 unsigned long Sz = LeftWrite();
257 if (Sz == 0)
258 return false;
927c393f 259 if (I - OutP < Sz)
be4401bf
AL
260 Sz = I - OutP;
261 Data += string((char *)(Buf + (OutP%Size)),Sz);
262 OutP += Sz;
263 }
264 return true;
265 }
266 return false;
267}
268 /*}}}*/
269// CircleBuf::Stats - Print out stats information /*{{{*/
270// ---------------------------------------------------------------------
271/* */
272void CircleBuf::Stats()
273{
274 if (InP == 0)
275 return;
276
277 struct timeval Stop;
278 gettimeofday(&Stop,0);
279/* float Diff = Stop.tv_sec - Start.tv_sec +
280 (float)(Stop.tv_usec - Start.tv_usec)/1000000;
281 clog << "Got " << InP << " in " << Diff << " at " << InP/Diff << endl;*/
282}
283 /*}}}*/
284
285// ServerState::ServerState - Constructor /*{{{*/
286// ---------------------------------------------------------------------
287/* */
288ServerState::ServerState(URI Srv,HttpMethod *Owner) : Owner(Owner),
3000ccea 289 In(64*1024), Out(4*1024),
be4401bf
AL
290 ServerName(Srv)
291{
292 Reset();
293}
294 /*}}}*/
295// ServerState::Open - Open a connection to the server /*{{{*/
296// ---------------------------------------------------------------------
297/* This opens a connection to the server. */
be4401bf
AL
298bool ServerState::Open()
299{
92e889c8
AL
300 // Use the already open connection if possible.
301 if (ServerFd != -1)
302 return true;
303
be4401bf 304 Close();
492f957a
AL
305 In.Reset();
306 Out.Reset();
e836f356
AL
307 Persistent = true;
308
492f957a 309 // Determine the proxy setting
52e7839a 310 if (getenv("http_proxy") == 0)
492f957a 311 {
352c2768
AL
312 string DefProxy = _config->Find("Acquire::http::Proxy");
313 string SpecificProxy = _config->Find("Acquire::http::Proxy::" + ServerName.Host);
314 if (SpecificProxy.empty() == false)
315 {
316 if (SpecificProxy == "DIRECT")
317 Proxy = "";
318 else
319 Proxy = SpecificProxy;
320 }
492f957a 321 else
352c2768
AL
322 Proxy = DefProxy;
323 }
492f957a 324 else
352c2768
AL
325 Proxy = getenv("http_proxy");
326
f8081133 327 // Parse no_proxy, a , separated list of domains
9e2a06ff
AL
328 if (getenv("no_proxy") != 0)
329 {
f8081133
AL
330 if (CheckDomainList(ServerName.Host,getenv("no_proxy")) == true)
331 Proxy = "";
332 }
333
492f957a 334 // Determine what host and port to use based on the proxy settings
934b6582 335 int Port = 0;
492f957a 336 string Host;
dd1fd92b 337 if (Proxy.empty() == true || Proxy.Host.empty() == true)
be4401bf 338 {
92e889c8
AL
339 if (ServerName.Port != 0)
340 Port = ServerName.Port;
be4401bf
AL
341 Host = ServerName.Host;
342 }
343 else
344 {
92e889c8
AL
345 if (Proxy.Port != 0)
346 Port = Proxy.Port;
be4401bf
AL
347 Host = Proxy.Host;
348 }
349
0837bd25 350 // Connect to the remote server
9505213b 351 if (Connect(Host,Port,"http",80,ServerFd,TimeOut,Owner) == false)
0837bd25 352 return false;
3000ccea 353
be4401bf
AL
354 return true;
355}
356 /*}}}*/
357// ServerState::Close - Close a connection to the server /*{{{*/
358// ---------------------------------------------------------------------
359/* */
360bool ServerState::Close()
361{
362 close(ServerFd);
363 ServerFd = -1;
be4401bf
AL
364 return true;
365}
366 /*}}}*/
367// ServerState::RunHeaders - Get the headers before the data /*{{{*/
368// ---------------------------------------------------------------------
92e889c8
AL
369/* Returns 0 if things are OK, 1 if an IO error occurred and 2 if a header
370 parse error occurred */
371int ServerState::RunHeaders()
be4401bf
AL
372{
373 State = Header;
374
519c5591 375 Owner->Status(_("Waiting for headers"));
be4401bf
AL
376
377 Major = 0;
378 Minor = 0;
379 Result = 0;
380 Size = 0;
381 StartPos = 0;
92e889c8
AL
382 Encoding = Closes;
383 HaveContent = false;
be4401bf
AL
384 time(&Date);
385
386 do
387 {
388 string Data;
389 if (In.WriteTillEl(Data) == false)
390 continue;
9d95e726
AL
391
392 if (Debug == true)
393 clog << Data;
be4401bf
AL
394
395 for (string::const_iterator I = Data.begin(); I < Data.end(); I++)
396 {
397 string::const_iterator J = I;
398 for (; J != Data.end() && *J != '\n' && *J != '\r';J++);
42195eb2 399 if (HeaderLine(string(I,J)) == false)
92e889c8 400 return 2;
be4401bf
AL
401 I = J;
402 }
e836f356 403
b2e465d6
AL
404 // 100 Continue is a Nop...
405 if (Result == 100)
406 continue;
407
e836f356
AL
408 // Tidy up the connection persistance state.
409 if (Encoding == Closes && HaveContent == true)
410 Persistent = false;
411
92e889c8 412 return 0;
be4401bf
AL
413 }
414 while (Owner->Go(false,this) == true);
e836f356 415
92e889c8 416 return 1;
be4401bf
AL
417}
418 /*}}}*/
419// ServerState::RunData - Transfer the data from the socket /*{{{*/
420// ---------------------------------------------------------------------
421/* */
422bool ServerState::RunData()
423{
424 State = Data;
425
426 // Chunked transfer encoding is fun..
427 if (Encoding == Chunked)
428 {
429 while (1)
430 {
431 // Grab the block size
432 bool Last = true;
433 string Data;
434 In.Limit(-1);
435 do
436 {
437 if (In.WriteTillEl(Data,true) == true)
438 break;
439 }
440 while ((Last = Owner->Go(false,this)) == true);
441
442 if (Last == false)
443 return false;
444
445 // See if we are done
446 unsigned long Len = strtol(Data.c_str(),0,16);
447 if (Len == 0)
448 {
449 In.Limit(-1);
450
451 // We have to remove the entity trailer
452 Last = true;
453 do
454 {
455 if (In.WriteTillEl(Data,true) == true && Data.length() <= 2)
456 break;
457 }
458 while ((Last = Owner->Go(false,this)) == true);
459 if (Last == false)
460 return false;
e1b96638 461 return !_error->PendingError();
be4401bf
AL
462 }
463
464 // Transfer the block
465 In.Limit(Len);
466 while (Owner->Go(true,this) == true)
467 if (In.IsLimit() == true)
468 break;
469
470 // Error
471 if (In.IsLimit() == false)
472 return false;
473
474 // The server sends an extra new line before the next block specifier..
475 In.Limit(-1);
476 Last = true;
477 do
478 {
479 if (In.WriteTillEl(Data,true) == true)
480 break;
481 }
482 while ((Last = Owner->Go(false,this)) == true);
483 if (Last == false)
484 return false;
92e889c8 485 }
be4401bf
AL
486 }
487 else
488 {
489 /* Closes encoding is used when the server did not specify a size, the
490 loss of the connection means we are done */
491 if (Encoding == Closes)
492 In.Limit(-1);
493 else
494 In.Limit(Size - StartPos);
495
496 // Just transfer the whole block.
497 do
498 {
499 if (In.IsLimit() == false)
500 continue;
501
502 In.Limit(-1);
e1b96638 503 return !_error->PendingError();
be4401bf
AL
504 }
505 while (Owner->Go(true,this) == true);
506 }
507
e1b96638 508 return Owner->Flush(this) && !_error->PendingError();
be4401bf
AL
509}
510 /*}}}*/
511// ServerState::HeaderLine - Process a header line /*{{{*/
512// ---------------------------------------------------------------------
513/* */
514bool ServerState::HeaderLine(string Line)
515{
516 if (Line.empty() == true)
517 return true;
30456e14 518
be4401bf
AL
519 // The http server might be trying to do something evil.
520 if (Line.length() >= MAXLEN)
dc738e7a 521 return _error->Error(_("Got a single header line over %u chars"),MAXLEN);
be4401bf
AL
522
523 string::size_type Pos = Line.find(' ');
524 if (Pos == string::npos || Pos+1 > Line.length())
c901051d
AL
525 {
526 // Blah, some servers use "connection:closes", evil.
527 Pos = Line.find(':');
528 if (Pos == string::npos || Pos + 2 > Line.length())
dc738e7a 529 return _error->Error(_("Bad header line"));
c901051d
AL
530 Pos++;
531 }
be4401bf 532
c901051d
AL
533 // Parse off any trailing spaces between the : and the next word.
534 string::size_type Pos2 = Pos;
535 while (Pos2 < Line.length() && isspace(Line[Pos2]) != 0)
536 Pos2++;
537
538 string Tag = string(Line,0,Pos);
539 string Val = string(Line,Pos2);
540
42195eb2 541 if (stringcasecmp(Tag.c_str(),Tag.c_str()+4,"HTTP") == 0)
be4401bf
AL
542 {
543 // Evil servers return no version
544 if (Line[4] == '/')
545 {
546 if (sscanf(Line.c_str(),"HTTP/%u.%u %u %[^\n]",&Major,&Minor,
547 &Result,Code) != 4)
db0db9fe 548 return _error->Error(_("The HTTP server sent an invalid reply header"));
be4401bf
AL
549 }
550 else
551 {
552 Major = 0;
553 Minor = 9;
554 if (sscanf(Line.c_str(),"HTTP %u %[^\n]",&Result,Code) != 2)
db0db9fe 555 return _error->Error(_("The HTTP server sent an invalid reply header"));
be4401bf 556 }
e836f356
AL
557
558 /* Check the HTTP response header to get the default persistance
559 state. */
560 if (Major < 1)
561 Persistent = false;
562 else
563 {
564 if (Major == 1 && Minor <= 0)
565 Persistent = false;
566 else
567 Persistent = true;
568 }
b2e465d6 569
be4401bf
AL
570 return true;
571 }
572
92e889c8 573 if (stringcasecmp(Tag,"Content-Length:") == 0)
be4401bf
AL
574 {
575 if (Encoding == Closes)
576 Encoding = Stream;
92e889c8 577 HaveContent = true;
be4401bf
AL
578
579 // The length is already set from the Content-Range header
580 if (StartPos != 0)
581 return true;
582
583 if (sscanf(Val.c_str(),"%lu",&Size) != 1)
db0db9fe 584 return _error->Error(_("The HTTP server sent an invalid Content-Length header"));
be4401bf
AL
585 return true;
586 }
587
92e889c8
AL
588 if (stringcasecmp(Tag,"Content-Type:") == 0)
589 {
590 HaveContent = true;
591 return true;
592 }
593
594 if (stringcasecmp(Tag,"Content-Range:") == 0)
be4401bf 595 {
92e889c8
AL
596 HaveContent = true;
597
be4401bf 598 if (sscanf(Val.c_str(),"bytes %lu-%*u/%lu",&StartPos,&Size) != 2)
db0db9fe 599 return _error->Error(_("The HTTP server sent an invalid Content-Range header"));
be4401bf 600 if ((unsigned)StartPos > Size)
db0db9fe 601 return _error->Error(_("This HTTP server has broken range support"));
be4401bf
AL
602 return true;
603 }
604
92e889c8 605 if (stringcasecmp(Tag,"Transfer-Encoding:") == 0)
be4401bf 606 {
92e889c8
AL
607 HaveContent = true;
608 if (stringcasecmp(Val,"chunked") == 0)
e836f356 609 Encoding = Chunked;
be4401bf
AL
610 return true;
611 }
612
e836f356
AL
613 if (stringcasecmp(Tag,"Connection:") == 0)
614 {
615 if (stringcasecmp(Val,"close") == 0)
616 Persistent = false;
617 if (stringcasecmp(Val,"keep-alive") == 0)
618 Persistent = true;
619 return true;
620 }
621
92e889c8 622 if (stringcasecmp(Tag,"Last-Modified:") == 0)
be4401bf
AL
623 {
624 if (StrToTime(Val,Date) == false)
dc738e7a 625 return _error->Error(_("Unknown date format"));
be4401bf
AL
626 return true;
627 }
628
629 return true;
630}
631 /*}}}*/
632
633// HttpMethod::SendReq - Send the HTTP request /*{{{*/
634// ---------------------------------------------------------------------
635/* This places the http request in the outbound buffer */
636void HttpMethod::SendReq(FetchItem *Itm,CircleBuf &Out)
637{
638 URI Uri = Itm->Uri;
c1a22377 639
be4401bf 640 // The HTTP server expects a hostname with a trailing :port
c1a22377 641 char Buf[1000];
be4401bf
AL
642 string ProperHost = Uri.Host;
643 if (Uri.Port != 0)
644 {
645 sprintf(Buf,":%u",Uri.Port);
646 ProperHost += Buf;
647 }
648
c1a22377
AL
649 // Just in case.
650 if (Itm->Uri.length() >= sizeof(Buf))
651 abort();
652
492f957a
AL
653 /* Build the request. We include a keep-alive header only for non-proxy
654 requests. This is to tweak old http/1.0 servers that do support keep-alive
655 but not HTTP/1.1 automatic keep-alive. Doing this with a proxy server
656 will glitch HTTP/1.0 proxies because they do not filter it out and
657 pass it on, HTTP/1.1 says the connection should default to keep alive
658 and we expect the proxy to do this */
be4401bf
AL
659 if (Proxy.empty() == true)
660 sprintf(Buf,"GET %s HTTP/1.1\r\nHost: %s\r\nConnection: keep-alive\r\n",
a4edf53b 661 QuoteString(Uri.Path,"~").c_str(),ProperHost.c_str());
be4401bf 662 else
c1a22377
AL
663 {
664 /* Generate a cache control header if necessary. We place a max
665 cache age on index files, optionally set a no-cache directive
666 and a no-store directive for archives. */
be4401bf
AL
667 sprintf(Buf,"GET %s HTTP/1.1\r\nHost: %s\r\n",
668 Itm->Uri.c_str(),ProperHost.c_str());
3573e286
MV
669 // only generate a cache control header if we actually want to
670 // use a cache
671 if (_config->FindB("Acquire::http::No-Cache",false) == false)
c1a22377
AL
672 {
673 if (Itm->IndexFile == true)
674 sprintf(Buf+strlen(Buf),"Cache-Control: max-age=%u\r\n",
bcbe61ae 675 _config->FindI("Acquire::http::Max-Age",0));
c1a22377
AL
676 else
677 {
678 if (_config->FindB("Acquire::http::No-Store",false) == true)
679 strcat(Buf,"Cache-Control: no-store\r\n");
680 }
681 }
682 }
3573e286
MV
683 // generate a no-cache header if needed
684 if (_config->FindB("Acquire::http::No-Cache",false) == true)
685 strcat(Buf,"Cache-Control: no-cache\r\nPragma: no-cache\r\n");
686
c1a22377 687
be4401bf 688 string Req = Buf;
492f957a 689
be4401bf
AL
690 // Check for a partial file
691 struct stat SBuf;
692 if (stat(Itm->DestFile.c_str(),&SBuf) >= 0 && SBuf.st_size > 0)
693 {
694 // In this case we send an if-range query with a range header
1ae93c94 695 sprintf(Buf,"Range: bytes=%li-\r\nIf-Range: %s\r\n",(long)SBuf.st_size - 1,
be4401bf
AL
696 TimeRFC1123(SBuf.st_mtime).c_str());
697 Req += Buf;
698 }
699 else
700 {
701 if (Itm->LastModified != 0)
702 {
703 sprintf(Buf,"If-Modified-Since: %s\r\n",TimeRFC1123(Itm->LastModified).c_str());
704 Req += Buf;
705 }
706 }
707
8d64c395
AL
708 if (Proxy.User.empty() == false || Proxy.Password.empty() == false)
709 Req += string("Proxy-Authorization: Basic ") +
710 Base64Encode(Proxy.User + ":" + Proxy.Password) + "\r\n";
be4401bf 711
b2e465d6
AL
712 if (Uri.User.empty() == false || Uri.Password.empty() == false)
713 Req += string("Authorization: Basic ") +
714 Base64Encode(Uri.User + ":" + Uri.Password) + "\r\n";
715
44a38e53 716 Req += "User-Agent: Debian APT-HTTP/1.3\r\n\r\n";
c98b1307
AL
717
718 if (Debug == true)
719 cerr << Req << endl;
c1a22377 720
be4401bf
AL
721 Out.Read(Req);
722}
723 /*}}}*/
724// HttpMethod::Go - Run a single loop /*{{{*/
725// ---------------------------------------------------------------------
726/* This runs the select loop over the server FDs, Output file FDs and
727 stdin. */
728bool HttpMethod::Go(bool ToFile,ServerState *Srv)
729{
730 // Server has closed the connection
8195ae46
AL
731 if (Srv->ServerFd == -1 && (Srv->In.WriteSpace() == false ||
732 ToFile == false))
be4401bf
AL
733 return false;
734
d955fe80 735 fd_set rfds,wfds;
be4401bf
AL
736 FD_ZERO(&rfds);
737 FD_ZERO(&wfds);
be4401bf 738
e836f356
AL
739 /* Add the server. We only send more requests if the connection will
740 be persisting */
741 if (Srv->Out.WriteSpace() == true && Srv->ServerFd != -1
742 && Srv->Persistent == true)
be4401bf 743 FD_SET(Srv->ServerFd,&wfds);
e836f356 744 if (Srv->In.ReadSpace() == true && Srv->ServerFd != -1)
be4401bf
AL
745 FD_SET(Srv->ServerFd,&rfds);
746
747 // Add the file
748 int FileFD = -1;
749 if (File != 0)
750 FileFD = File->Fd();
751
752 if (Srv->In.WriteSpace() == true && ToFile == true && FileFD != -1)
753 FD_SET(FileFD,&wfds);
754
755 // Add stdin
756 FD_SET(STDIN_FILENO,&rfds);
757
be4401bf
AL
758 // Figure out the max fd
759 int MaxFd = FileFD;
760 if (MaxFd < Srv->ServerFd)
761 MaxFd = Srv->ServerFd;
8195ae46 762
be4401bf
AL
763 // Select
764 struct timeval tv;
3000ccea 765 tv.tv_sec = TimeOut;
be4401bf
AL
766 tv.tv_usec = 0;
767 int Res = 0;
d955fe80 768 if ((Res = select(MaxFd+1,&rfds,&wfds,0,&tv)) < 0)
c37b9502
AL
769 {
770 if (errno == EINTR)
771 return true;
dc738e7a 772 return _error->Errno("select",_("Select failed"));
c37b9502 773 }
be4401bf
AL
774
775 if (Res == 0)
776 {
dc738e7a 777 _error->Error(_("Connection timed out"));
be4401bf
AL
778 return ServerDie(Srv);
779 }
780
be4401bf
AL
781 // Handle server IO
782 if (Srv->ServerFd != -1 && FD_ISSET(Srv->ServerFd,&rfds))
783 {
784 errno = 0;
785 if (Srv->In.Read(Srv->ServerFd) == false)
786 return ServerDie(Srv);
787 }
788
789 if (Srv->ServerFd != -1 && FD_ISSET(Srv->ServerFd,&wfds))
790 {
791 errno = 0;
792 if (Srv->Out.Write(Srv->ServerFd) == false)
793 return ServerDie(Srv);
794 }
795
796 // Send data to the file
797 if (FileFD != -1 && FD_ISSET(FileFD,&wfds))
798 {
799 if (Srv->In.Write(FileFD) == false)
dc738e7a 800 return _error->Errno("write",_("Error writing to output file"));
be4401bf
AL
801 }
802
803 // Handle commands from APT
804 if (FD_ISSET(STDIN_FILENO,&rfds))
805 {
6920216d 806 if (Run(true) != -1)
be4401bf
AL
807 exit(100);
808 }
809
810 return true;
811}
812 /*}}}*/
813// HttpMethod::Flush - Dump the buffer into the file /*{{{*/
814// ---------------------------------------------------------------------
815/* This takes the current input buffer from the Server FD and writes it
816 into the file */
817bool HttpMethod::Flush(ServerState *Srv)
818{
819 if (File != 0)
820 {
b57c8bb4
MV
821 // on GNU/kFreeBSD, apt dies on /dev/null because non-blocking
822 // can't be set
823 if (File->Name() != "/dev/null")
824 SetNonBlock(File->Fd(),false);
be4401bf
AL
825 if (Srv->In.WriteSpace() == false)
826 return true;
827
828 while (Srv->In.WriteSpace() == true)
829 {
830 if (Srv->In.Write(File->Fd()) == false)
dc738e7a 831 return _error->Errno("write",_("Error writing to file"));
92e889c8
AL
832 if (Srv->In.IsLimit() == true)
833 return true;
be4401bf
AL
834 }
835
836 if (Srv->In.IsLimit() == true || Srv->Encoding == ServerState::Closes)
837 return true;
838 }
839 return false;
840}
841 /*}}}*/
842// HttpMethod::ServerDie - The server has closed the connection. /*{{{*/
843// ---------------------------------------------------------------------
844/* */
845bool HttpMethod::ServerDie(ServerState *Srv)
846{
2b154e53
AL
847 unsigned int LErrno = errno;
848
be4401bf
AL
849 // Dump the buffer to the file
850 if (Srv->State == ServerState::Data)
851 {
b57c8bb4
MV
852 // on GNU/kFreeBSD, apt dies on /dev/null because non-blocking
853 // can't be set
854 if (File->Name() != "/dev/null")
855 SetNonBlock(File->Fd(),false);
be4401bf
AL
856 while (Srv->In.WriteSpace() == true)
857 {
858 if (Srv->In.Write(File->Fd()) == false)
dc738e7a 859 return _error->Errno("write",_("Error writing to the file"));
92e889c8
AL
860
861 // Done
862 if (Srv->In.IsLimit() == true)
863 return true;
be4401bf
AL
864 }
865 }
866
867 // See if this is because the server finished the data stream
868 if (Srv->In.IsLimit() == false && Srv->State != ServerState::Header &&
869 Srv->Encoding != ServerState::Closes)
870 {
3d615484 871 Srv->Close();
2b154e53 872 if (LErrno == 0)
db0db9fe 873 return _error->Error(_("Error reading from server. Remote end closed connection"));
2b154e53 874 errno = LErrno;
dc738e7a 875 return _error->Errno("read",_("Error reading from server"));
be4401bf
AL
876 }
877 else
878 {
879 Srv->In.Limit(-1);
880
881 // Nothing left in the buffer
882 if (Srv->In.WriteSpace() == false)
883 return false;
884
885 // We may have got multiple responses back in one packet..
886 Srv->Close();
887 return true;
888 }
889
890 return false;
891}
892 /*}}}*/
893// HttpMethod::DealWithHeaders - Handle the retrieved header data /*{{{*/
894// ---------------------------------------------------------------------
895/* We look at the header data we got back from the server and decide what
896 to do. Returns
897 0 - File is open,
898 1 - IMS hit
92e889c8 899 3 - Unrecoverable error
94235cfb
AL
900 4 - Error with error content page
901 5 - Unrecoverable non-server error (close the connection) */
be4401bf
AL
902int HttpMethod::DealWithHeaders(FetchResult &Res,ServerState *Srv)
903{
904 // Not Modified
905 if (Srv->Result == 304)
906 {
907 unlink(Queue->DestFile.c_str());
908 Res.IMSHit = true;
909 Res.LastModified = Queue->LastModified;
910 return 1;
911 }
912
913 /* We have a reply we dont handle. This should indicate a perm server
914 failure */
915 if (Srv->Result < 200 || Srv->Result >= 300)
916 {
917 _error->Error("%u %s",Srv->Result,Srv->Code);
92e889c8
AL
918 if (Srv->HaveContent == true)
919 return 4;
be4401bf
AL
920 return 3;
921 }
922
923 // This is some sort of 2xx 'data follows' reply
924 Res.LastModified = Srv->Date;
925 Res.Size = Srv->Size;
926
927 // Open the file
928 delete File;
929 File = new FileFd(Queue->DestFile,FileFd::WriteAny);
930 if (_error->PendingError() == true)
94235cfb 931 return 5;
492f957a
AL
932
933 FailFile = Queue->DestFile;
30b30ec1 934 FailFile.c_str(); // Make sure we dont do a malloc in the signal handler
492f957a
AL
935 FailFd = File->Fd();
936 FailTime = Srv->Date;
937
be4401bf
AL
938 // Set the expected size
939 if (Srv->StartPos >= 0)
940 {
941 Res.ResumePoint = Srv->StartPos;
942 ftruncate(File->Fd(),Srv->StartPos);
943 }
944
945 // Set the start point
946 lseek(File->Fd(),0,SEEK_END);
947
63b1700f
AL
948 delete Srv->In.Hash;
949 Srv->In.Hash = new Hashes;
be4401bf 950
63b1700f 951 // Fill the Hash if the file is non-empty (resume)
be4401bf
AL
952 if (Srv->StartPos > 0)
953 {
954 lseek(File->Fd(),0,SEEK_SET);
63b1700f 955 if (Srv->In.Hash->AddFD(File->Fd(),Srv->StartPos) == false)
be4401bf 956 {
dc738e7a 957 _error->Errno("read",_("Problem hashing file"));
94235cfb 958 return 5;
be4401bf
AL
959 }
960 lseek(File->Fd(),0,SEEK_END);
961 }
962
963 SetNonBlock(File->Fd(),true);
964 return 0;
965}
966 /*}}}*/
492f957a
AL
967// HttpMethod::SigTerm - Handle a fatal signal /*{{{*/
968// ---------------------------------------------------------------------
969/* This closes and timestamps the open file. This is necessary to get
970 resume behavior on user abort */
971void HttpMethod::SigTerm(int)
972{
973 if (FailFd == -1)
ffe9323a 974 _exit(100);
492f957a
AL
975 close(FailFd);
976
977 // Timestamp
978 struct utimbuf UBuf;
492f957a
AL
979 UBuf.actime = FailTime;
980 UBuf.modtime = FailTime;
981 utime(FailFile.c_str(),&UBuf);
982
ffe9323a 983 _exit(100);
492f957a
AL
984}
985 /*}}}*/
5cb5d8dc
AL
986// HttpMethod::Fetch - Fetch an item /*{{{*/
987// ---------------------------------------------------------------------
988/* This adds an item to the pipeline. We keep the pipeline at a fixed
989 depth. */
990bool HttpMethod::Fetch(FetchItem *)
991{
992 if (Server == 0)
993 return true;
3000ccea 994
5cb5d8dc
AL
995 // Queue the requests
996 int Depth = -1;
997 bool Tail = false;
f93d1355
AL
998 for (FetchItem *I = Queue; I != 0 && Depth < (signed)PipelineDepth;
999 I = I->Next, Depth++)
5cb5d8dc 1000 {
f93d1355
AL
1001 // If pipelining is disabled, we only queue 1 request
1002 if (Server->Pipeline == false && Depth >= 0)
1003 break;
1004
5cb5d8dc
AL
1005 // Make sure we stick with the same server
1006 if (Server->Comp(I->Uri) == false)
1007 break;
5cb5d8dc
AL
1008 if (QueueBack == I)
1009 Tail = true;
1010 if (Tail == true)
1011 {
5cb5d8dc
AL
1012 QueueBack = I->Next;
1013 SendReq(I,Server->Out);
1014 continue;
f93d1355 1015 }
5cb5d8dc
AL
1016 }
1017
1018 return true;
1019};
1020 /*}}}*/
85f72a56
AL
1021// HttpMethod::Configuration - Handle a configuration message /*{{{*/
1022// ---------------------------------------------------------------------
1023/* We stash the desired pipeline depth */
1024bool HttpMethod::Configuration(string Message)
1025{
1026 if (pkgAcqMethod::Configuration(Message) == false)
1027 return false;
1028
30456e14
AL
1029 TimeOut = _config->FindI("Acquire::http::Timeout",TimeOut);
1030 PipelineDepth = _config->FindI("Acquire::http::Pipeline-Depth",
1031 PipelineDepth);
c98b1307 1032 Debug = _config->FindB("Debug::Acquire::http",false);
3000ccea 1033
85f72a56
AL
1034 return true;
1035}
1036 /*}}}*/
492f957a 1037// HttpMethod::Loop - Main loop /*{{{*/
be4401bf
AL
1038// ---------------------------------------------------------------------
1039/* */
1040int HttpMethod::Loop()
1041{
492f957a
AL
1042 signal(SIGTERM,SigTerm);
1043 signal(SIGINT,SigTerm);
1044
5cb5d8dc 1045 Server = 0;
be4401bf 1046
92e889c8 1047 int FailCounter = 0;
be4401bf 1048 while (1)
2b154e53 1049 {
be4401bf
AL
1050 // We have no commands, wait for some to arrive
1051 if (Queue == 0)
1052 {
1053 if (WaitFd(STDIN_FILENO) == false)
1054 return 0;
1055 }
1056
6920216d
AL
1057 /* Run messages, we can accept 0 (no message) if we didn't
1058 do a WaitFd above.. Otherwise the FD is closed. */
1059 int Result = Run(true);
1060 if (Result != -1 && (Result != 0 || Queue == 0))
be4401bf
AL
1061 return 100;
1062
1063 if (Queue == 0)
1064 continue;
1065
1066 // Connect to the server
1067 if (Server == 0 || Server->Comp(Queue->Uri) == false)
1068 {
1069 delete Server;
1070 Server = new ServerState(Queue->Uri,this);
1071 }
e836f356
AL
1072
1073 /* If the server has explicitly said this is the last connection
1074 then we pre-emptively shut down the pipeline and tear down
1075 the connection. This will speed up HTTP/1.0 servers a tad
1076 since we don't have to wait for the close sequence to
1077 complete */
1078 if (Server->Persistent == false)
1079 Server->Close();
1080
a7fb252c
AL
1081 // Reset the pipeline
1082 if (Server->ServerFd == -1)
1083 QueueBack = Queue;
1084
be4401bf
AL
1085 // Connnect to the host
1086 if (Server->Open() == false)
1087 {
43252d15 1088 Fail(true);
a1459f52
AL
1089 delete Server;
1090 Server = 0;
be4401bf
AL
1091 continue;
1092 }
be4401bf 1093
5cb5d8dc
AL
1094 // Fill the pipeline.
1095 Fetch(0);
1096
92e889c8
AL
1097 // Fetch the next URL header data from the server.
1098 switch (Server->RunHeaders())
be4401bf 1099 {
92e889c8
AL
1100 case 0:
1101 break;
1102
1103 // The header data is bad
1104 case 2:
1105 {
db0db9fe 1106 _error->Error(_("Bad header data"));
43252d15 1107 Fail(true);
b2e465d6 1108 RotateDNS();
92e889c8
AL
1109 continue;
1110 }
1111
1112 // The server closed a connection during the header get..
1113 default:
1114 case 1:
1115 {
1116 FailCounter++;
3d615484 1117 _error->Discard();
92e889c8 1118 Server->Close();
f93d1355
AL
1119 Server->Pipeline = false;
1120
2b154e53
AL
1121 if (FailCounter >= 2)
1122 {
dc738e7a 1123 Fail(_("Connection failed"),true);
2b154e53
AL
1124 FailCounter = 0;
1125 }
1126
b2e465d6 1127 RotateDNS();
92e889c8
AL
1128 continue;
1129 }
1130 };
5cb5d8dc 1131
be4401bf
AL
1132 // Decide what to do.
1133 FetchResult Res;
bfd22fc0 1134 Res.Filename = Queue->DestFile;
be4401bf
AL
1135 switch (DealWithHeaders(Res,Server))
1136 {
1137 // Ok, the file is Open
1138 case 0:
1139 {
1140 URIStart(Res);
1141
1142 // Run the data
492f957a
AL
1143 bool Result = Server->RunData();
1144
b2e465d6
AL
1145 /* If the server is sending back sizeless responses then fill in
1146 the size now */
1147 if (Res.Size == 0)
1148 Res.Size = File->Size();
1149
492f957a
AL
1150 // Close the file, destroy the FD object and timestamp it
1151 FailFd = -1;
1152 delete File;
1153 File = 0;
1154
1155 // Timestamp
1156 struct utimbuf UBuf;
1157 time(&UBuf.actime);
1158 UBuf.actime = Server->Date;
1159 UBuf.modtime = Server->Date;
1160 utime(Queue->DestFile.c_str(),&UBuf);
1161
1162 // Send status to APT
1163 if (Result == true)
92e889c8 1164 {
a7c835af 1165 Res.TakeHashes(*Server->In.Hash);
92e889c8
AL
1166 URIDone(Res);
1167 }
492f957a 1168 else
2b154e53 1169 Fail(true);
e836f356 1170
be4401bf
AL
1171 break;
1172 }
1173
1174 // IMS hit
1175 case 1:
1176 {
1177 URIDone(Res);
1178 break;
1179 }
1180
1181 // Hard server error, not found or something
1182 case 3:
1183 {
1184 Fail();
1185 break;
1186 }
94235cfb
AL
1187
1188 // Hard internal error, kill the connection and fail
1189 case 5:
1190 {
a305f593
AL
1191 delete File;
1192 File = 0;
1193
94235cfb 1194 Fail();
b2e465d6 1195 RotateDNS();
94235cfb
AL
1196 Server->Close();
1197 break;
1198 }
92e889c8
AL
1199
1200 // We need to flush the data, the header is like a 404 w/ error text
1201 case 4:
1202 {
1203 Fail();
1204
1205 // Send to content to dev/null
1206 File = new FileFd("/dev/null",FileFd::WriteExists);
1207 Server->RunData();
1208 delete File;
1209 File = 0;
1210 break;
1211 }
be4401bf
AL
1212
1213 default:
dc738e7a 1214 Fail(_("Internal error"));
be4401bf 1215 break;
92e889c8
AL
1216 }
1217
1218 FailCounter = 0;
be4401bf
AL
1219 }
1220
1221 return 0;
1222}
1223 /*}}}*/
1224
1225int main()
1226{
049c0171 1227 setlocale(LC_ALL, "");
049c0171 1228
be4401bf
AL
1229 HttpMethod Mth;
1230
1231 return Mth.Loop();
1232}
a305f593
AL
1233
1234