]> git.saurik.com Git - apt.git/blame - methods/http.cc
Add a GetListOfFilesInDir() helper method which replaces the old
[apt.git] / methods / http.cc
CommitLineData
be4401bf
AL
1// -*- mode: cpp; mode: fold -*-
2// Description /*{{{*/
2cbcabd8 3// $Id: http.cc,v 1.59 2004/05/08 19:42:35 mdz Exp $
be4401bf
AL
4/* ######################################################################
5
ae58a985 6 HTTP Acquire Method - This is the HTTP acquire method for APT.
be4401bf
AL
7
8 It uses HTTP/1.1 and many of the fancy options there-in, such as
e836f356
AL
9 pipelining, range, if-range and so on.
10
11 It is based on a doubly buffered select loop. A group of requests is
be4401bf
AL
12 fed into a single output buffer that is constantly fed out the
13 socket. This provides ideal pipelining as in many cases all of the
14 requests will fit into a single packet. The input socket is buffered
e836f356 15 the same way and fed into the fd for the file (may be a pipe in future).
be4401bf
AL
16
17 This double buffering provides fairly substantial transfer rates,
18 compared to wget the http method is about 4% faster. Most importantly,
19 when HTTP is compared with FTP as a protocol the speed difference is
20 huge. In tests over the internet from two sites to llug (via ATM) this
21 program got 230k/s sustained http transfer rates. FTP on the other
22 hand topped out at 170k/s. That combined with the time to setup the
23 FTP connection makes HTTP a vastly superior protocol.
24
25 ##################################################################### */
26 /*}}}*/
27// Include Files /*{{{*/
28#include <apt-pkg/fileutl.h>
29#include <apt-pkg/acquire-method.h>
30#include <apt-pkg/error.h>
63b1700f 31#include <apt-pkg/hashes.h>
592b7800 32#include <apt-pkg/netrc.h>
be4401bf
AL
33
34#include <sys/stat.h>
35#include <sys/time.h>
36#include <utime.h>
37#include <unistd.h>
492f957a 38#include <signal.h>
be4401bf 39#include <stdio.h>
65a1e968 40#include <errno.h>
42195eb2
AL
41#include <string.h>
42#include <iostream>
15d7e515 43#include <map>
d77559ac 44#include <apti18n.h>
be4401bf 45
592b7800 46
be4401bf 47// Internet stuff
0837bd25 48#include <netdb.h>
be4401bf 49
59b46c41 50#include "config.h"
0837bd25 51#include "connect.h"
934b6582 52#include "rfc2553emu.h"
be4401bf
AL
53#include "http.h"
54 /*}}}*/
42195eb2 55using namespace std;
be4401bf 56
492f957a
AL
57string HttpMethod::FailFile;
58int HttpMethod::FailFd = -1;
59time_t HttpMethod::FailTime = 0;
c37030c2 60unsigned long PipelineDepth = 10;
3000ccea 61unsigned long TimeOut = 120;
15d7e515 62bool AllowRedirect = false;
c98b1307 63bool Debug = false;
c37030c2 64URI Proxy;
492f957a 65
7c6e2dc7
MV
66unsigned long CircleBuf::BwReadLimit=0;
67unsigned long CircleBuf::BwTickReadData=0;
68struct timeval CircleBuf::BwReadTick={0,0};
69const unsigned int CircleBuf::BW_HZ=10;
70
be4401bf
AL
71// CircleBuf::CircleBuf - Circular input buffer /*{{{*/
72// ---------------------------------------------------------------------
73/* */
63b1700f 74CircleBuf::CircleBuf(unsigned long Size) : Size(Size), Hash(0)
be4401bf
AL
75{
76 Buf = new unsigned char[Size];
77 Reset();
7c6e2dc7
MV
78
79 CircleBuf::BwReadLimit = _config->FindI("Acquire::http::Dl-Limit",0)*1024;
be4401bf
AL
80}
81 /*}}}*/
82// CircleBuf::Reset - Reset to the default state /*{{{*/
83// ---------------------------------------------------------------------
84/* */
85void CircleBuf::Reset()
86{
87 InP = 0;
88 OutP = 0;
89 StrPos = 0;
90 MaxGet = (unsigned int)-1;
91 OutQueue = string();
63b1700f 92 if (Hash != 0)
be4401bf 93 {
63b1700f
AL
94 delete Hash;
95 Hash = new Hashes;
be4401bf
AL
96 }
97};
98 /*}}}*/
99// CircleBuf::Read - Read from a FD into the circular buffer /*{{{*/
100// ---------------------------------------------------------------------
101/* This fills up the buffer with as much data as is in the FD, assuming it
102 is non-blocking.. */
103bool CircleBuf::Read(int Fd)
104{
7c6e2dc7
MV
105 unsigned long BwReadMax;
106
be4401bf
AL
107 while (1)
108 {
109 // Woops, buffer is full
110 if (InP - OutP == Size)
111 return true;
7c6e2dc7
MV
112
113 // what's left to read in this tick
114 BwReadMax = CircleBuf::BwReadLimit/BW_HZ;
115
116 if(CircleBuf::BwReadLimit) {
117 struct timeval now;
118 gettimeofday(&now,0);
119
120 unsigned long d = (now.tv_sec-CircleBuf::BwReadTick.tv_sec)*1000000 +
121 now.tv_usec-CircleBuf::BwReadTick.tv_usec;
122 if(d > 1000000/BW_HZ) {
123 CircleBuf::BwReadTick = now;
124 CircleBuf::BwTickReadData = 0;
125 }
126
127 if(CircleBuf::BwTickReadData >= BwReadMax) {
128 usleep(1000000/BW_HZ);
129 return true;
130 }
131 }
132
be4401bf
AL
133 // Write the buffer segment
134 int Res;
7c6e2dc7
MV
135 if(CircleBuf::BwReadLimit) {
136 Res = read(Fd,Buf + (InP%Size),
137 BwReadMax > LeftRead() ? LeftRead() : BwReadMax);
138 } else
139 Res = read(Fd,Buf + (InP%Size),LeftRead());
be4401bf 140
7c6e2dc7
MV
141 if(Res > 0 && BwReadLimit > 0)
142 CircleBuf::BwTickReadData += Res;
143
be4401bf
AL
144 if (Res == 0)
145 return false;
146 if (Res < 0)
147 {
148 if (errno == EAGAIN)
149 return true;
150 return false;
151 }
152
153 if (InP == 0)
154 gettimeofday(&Start,0);
155 InP += Res;
156 }
157}
158 /*}}}*/
159// CircleBuf::Read - Put the string into the buffer /*{{{*/
160// ---------------------------------------------------------------------
161/* This will hold the string in and fill the buffer with it as it empties */
162bool CircleBuf::Read(string Data)
163{
164 OutQueue += Data;
165 FillOut();
166 return true;
167}
168 /*}}}*/
169// CircleBuf::FillOut - Fill the buffer from the output queue /*{{{*/
170// ---------------------------------------------------------------------
171/* */
172void CircleBuf::FillOut()
173{
174 if (OutQueue.empty() == true)
175 return;
176 while (1)
177 {
178 // Woops, buffer is full
179 if (InP - OutP == Size)
180 return;
181
182 // Write the buffer segment
183 unsigned long Sz = LeftRead();
184 if (OutQueue.length() - StrPos < Sz)
185 Sz = OutQueue.length() - StrPos;
42195eb2 186 memcpy(Buf + (InP%Size),OutQueue.c_str() + StrPos,Sz);
be4401bf
AL
187
188 // Advance
189 StrPos += Sz;
190 InP += Sz;
191 if (OutQueue.length() == StrPos)
192 {
193 StrPos = 0;
194 OutQueue = "";
195 return;
196 }
197 }
198}
199 /*}}}*/
200// CircleBuf::Write - Write from the buffer into a FD /*{{{*/
201// ---------------------------------------------------------------------
202/* This empties the buffer into the FD. */
203bool CircleBuf::Write(int Fd)
204{
205 while (1)
206 {
207 FillOut();
208
209 // Woops, buffer is empty
210 if (OutP == InP)
211 return true;
212
213 if (OutP == MaxGet)
214 return true;
215
216 // Write the buffer segment
217 int Res;
218 Res = write(Fd,Buf + (OutP%Size),LeftWrite());
219
220 if (Res == 0)
221 return false;
222 if (Res < 0)
223 {
224 if (errno == EAGAIN)
225 return true;
226
227 return false;
228 }
229
63b1700f
AL
230 if (Hash != 0)
231 Hash->Add(Buf + (OutP%Size),Res);
be4401bf
AL
232
233 OutP += Res;
234 }
235}
236 /*}}}*/
237// CircleBuf::WriteTillEl - Write from the buffer to a string /*{{{*/
238// ---------------------------------------------------------------------
239/* This copies till the first empty line */
240bool CircleBuf::WriteTillEl(string &Data,bool Single)
241{
242 // We cheat and assume it is unneeded to have more than one buffer load
243 for (unsigned long I = OutP; I < InP; I++)
244 {
245 if (Buf[I%Size] != '\n')
246 continue;
2cbcabd8 247 ++I;
be4401bf
AL
248
249 if (Single == false)
250 {
2cbcabd8
AL
251 if (I < InP && Buf[I%Size] == '\r')
252 ++I;
927c393f
MV
253 if (I >= InP || Buf[I%Size] != '\n')
254 continue;
255 ++I;
be4401bf
AL
256 }
257
be4401bf
AL
258 Data = "";
259 while (OutP < I)
260 {
261 unsigned long Sz = LeftWrite();
262 if (Sz == 0)
263 return false;
927c393f 264 if (I - OutP < Sz)
be4401bf
AL
265 Sz = I - OutP;
266 Data += string((char *)(Buf + (OutP%Size)),Sz);
267 OutP += Sz;
268 }
269 return true;
270 }
271 return false;
272}
273 /*}}}*/
274// CircleBuf::Stats - Print out stats information /*{{{*/
275// ---------------------------------------------------------------------
276/* */
277void CircleBuf::Stats()
278{
279 if (InP == 0)
280 return;
281
282 struct timeval Stop;
283 gettimeofday(&Stop,0);
284/* float Diff = Stop.tv_sec - Start.tv_sec +
285 (float)(Stop.tv_usec - Start.tv_usec)/1000000;
286 clog << "Got " << InP << " in " << Diff << " at " << InP/Diff << endl;*/
287}
288 /*}}}*/
289
290// ServerState::ServerState - Constructor /*{{{*/
291// ---------------------------------------------------------------------
292/* */
293ServerState::ServerState(URI Srv,HttpMethod *Owner) : Owner(Owner),
3000ccea 294 In(64*1024), Out(4*1024),
be4401bf
AL
295 ServerName(Srv)
296{
297 Reset();
298}
299 /*}}}*/
300// ServerState::Open - Open a connection to the server /*{{{*/
301// ---------------------------------------------------------------------
302/* This opens a connection to the server. */
be4401bf
AL
303bool ServerState::Open()
304{
92e889c8
AL
305 // Use the already open connection if possible.
306 if (ServerFd != -1)
307 return true;
308
be4401bf 309 Close();
492f957a
AL
310 In.Reset();
311 Out.Reset();
e836f356
AL
312 Persistent = true;
313
492f957a 314 // Determine the proxy setting
788a8f42
EL
315 string SpecificProxy = _config->Find("Acquire::http::Proxy::" + ServerName.Host);
316 if (!SpecificProxy.empty())
492f957a 317 {
788a8f42
EL
318 if (SpecificProxy == "DIRECT")
319 Proxy = "";
320 else
321 Proxy = SpecificProxy;
352c2768 322 }
492f957a 323 else
788a8f42
EL
324 {
325 string DefProxy = _config->Find("Acquire::http::Proxy");
326 if (!DefProxy.empty())
327 {
328 Proxy = DefProxy;
329 }
330 else
331 {
332 char* result = getenv("http_proxy");
333 Proxy = result ? result : "";
334 }
335 }
352c2768 336
f8081133 337 // Parse no_proxy, a , separated list of domains
9e2a06ff
AL
338 if (getenv("no_proxy") != 0)
339 {
f8081133
AL
340 if (CheckDomainList(ServerName.Host,getenv("no_proxy")) == true)
341 Proxy = "";
342 }
343
492f957a 344 // Determine what host and port to use based on the proxy settings
934b6582 345 int Port = 0;
492f957a 346 string Host;
dd1fd92b 347 if (Proxy.empty() == true || Proxy.Host.empty() == true)
be4401bf 348 {
92e889c8
AL
349 if (ServerName.Port != 0)
350 Port = ServerName.Port;
be4401bf
AL
351 Host = ServerName.Host;
352 }
353 else
354 {
92e889c8
AL
355 if (Proxy.Port != 0)
356 Port = Proxy.Port;
be4401bf
AL
357 Host = Proxy.Host;
358 }
359
0837bd25 360 // Connect to the remote server
9505213b 361 if (Connect(Host,Port,"http",80,ServerFd,TimeOut,Owner) == false)
0837bd25 362 return false;
3000ccea 363
be4401bf
AL
364 return true;
365}
366 /*}}}*/
367// ServerState::Close - Close a connection to the server /*{{{*/
368// ---------------------------------------------------------------------
369/* */
370bool ServerState::Close()
371{
372 close(ServerFd);
373 ServerFd = -1;
be4401bf
AL
374 return true;
375}
376 /*}}}*/
377// ServerState::RunHeaders - Get the headers before the data /*{{{*/
378// ---------------------------------------------------------------------
38965a34
MV
379/* Returns 0 if things are OK, 1 if an IO error occurred and 2 if a header
380 parse error occurred */
92e889c8 381int ServerState::RunHeaders()
be4401bf
AL
382{
383 State = Header;
384
519c5591 385 Owner->Status(_("Waiting for headers"));
be4401bf
AL
386
387 Major = 0;
388 Minor = 0;
389 Result = 0;
390 Size = 0;
391 StartPos = 0;
92e889c8
AL
392 Encoding = Closes;
393 HaveContent = false;
be4401bf
AL
394 time(&Date);
395
396 do
397 {
398 string Data;
399 if (In.WriteTillEl(Data) == false)
400 continue;
9d95e726
AL
401
402 if (Debug == true)
403 clog << Data;
be4401bf
AL
404
405 for (string::const_iterator I = Data.begin(); I < Data.end(); I++)
406 {
407 string::const_iterator J = I;
408 for (; J != Data.end() && *J != '\n' && *J != '\r';J++);
42195eb2 409 if (HeaderLine(string(I,J)) == false)
92e889c8 410 return 2;
be4401bf
AL
411 I = J;
412 }
e836f356 413
b2e465d6
AL
414 // 100 Continue is a Nop...
415 if (Result == 100)
416 continue;
417
e836f356
AL
418 // Tidy up the connection persistance state.
419 if (Encoding == Closes && HaveContent == true)
420 Persistent = false;
421
92e889c8 422 return 0;
be4401bf
AL
423 }
424 while (Owner->Go(false,this) == true);
e836f356 425
92e889c8 426 return 1;
be4401bf
AL
427}
428 /*}}}*/
429// ServerState::RunData - Transfer the data from the socket /*{{{*/
430// ---------------------------------------------------------------------
431/* */
432bool ServerState::RunData()
433{
434 State = Data;
435
436 // Chunked transfer encoding is fun..
437 if (Encoding == Chunked)
438 {
439 while (1)
440 {
441 // Grab the block size
442 bool Last = true;
443 string Data;
444 In.Limit(-1);
445 do
446 {
447 if (In.WriteTillEl(Data,true) == true)
448 break;
449 }
450 while ((Last = Owner->Go(false,this)) == true);
451
452 if (Last == false)
453 return false;
454
455 // See if we are done
456 unsigned long Len = strtol(Data.c_str(),0,16);
457 if (Len == 0)
458 {
459 In.Limit(-1);
460
461 // We have to remove the entity trailer
462 Last = true;
463 do
464 {
465 if (In.WriteTillEl(Data,true) == true && Data.length() <= 2)
466 break;
467 }
468 while ((Last = Owner->Go(false,this)) == true);
469 if (Last == false)
470 return false;
e1b96638 471 return !_error->PendingError();
be4401bf
AL
472 }
473
474 // Transfer the block
475 In.Limit(Len);
476 while (Owner->Go(true,this) == true)
477 if (In.IsLimit() == true)
478 break;
479
480 // Error
481 if (In.IsLimit() == false)
482 return false;
483
484 // The server sends an extra new line before the next block specifier..
485 In.Limit(-1);
486 Last = true;
487 do
488 {
489 if (In.WriteTillEl(Data,true) == true)
490 break;
491 }
492 while ((Last = Owner->Go(false,this)) == true);
493 if (Last == false)
494 return false;
92e889c8 495 }
be4401bf
AL
496 }
497 else
498 {
499 /* Closes encoding is used when the server did not specify a size, the
500 loss of the connection means we are done */
501 if (Encoding == Closes)
502 In.Limit(-1);
503 else
504 In.Limit(Size - StartPos);
505
506 // Just transfer the whole block.
507 do
508 {
509 if (In.IsLimit() == false)
510 continue;
511
512 In.Limit(-1);
e1b96638 513 return !_error->PendingError();
be4401bf
AL
514 }
515 while (Owner->Go(true,this) == true);
516 }
517
e1b96638 518 return Owner->Flush(this) && !_error->PendingError();
be4401bf
AL
519}
520 /*}}}*/
521// ServerState::HeaderLine - Process a header line /*{{{*/
522// ---------------------------------------------------------------------
523/* */
524bool ServerState::HeaderLine(string Line)
525{
526 if (Line.empty() == true)
527 return true;
30456e14 528
be4401bf
AL
529 // The http server might be trying to do something evil.
530 if (Line.length() >= MAXLEN)
dc738e7a 531 return _error->Error(_("Got a single header line over %u chars"),MAXLEN);
be4401bf
AL
532
533 string::size_type Pos = Line.find(' ');
534 if (Pos == string::npos || Pos+1 > Line.length())
c901051d
AL
535 {
536 // Blah, some servers use "connection:closes", evil.
537 Pos = Line.find(':');
538 if (Pos == string::npos || Pos + 2 > Line.length())
dc738e7a 539 return _error->Error(_("Bad header line"));
c901051d
AL
540 Pos++;
541 }
be4401bf 542
c901051d
AL
543 // Parse off any trailing spaces between the : and the next word.
544 string::size_type Pos2 = Pos;
545 while (Pos2 < Line.length() && isspace(Line[Pos2]) != 0)
546 Pos2++;
547
548 string Tag = string(Line,0,Pos);
549 string Val = string(Line,Pos2);
550
42195eb2 551 if (stringcasecmp(Tag.c_str(),Tag.c_str()+4,"HTTP") == 0)
be4401bf
AL
552 {
553 // Evil servers return no version
554 if (Line[4] == '/')
555 {
dda7233c 556 if (sscanf(Line.c_str(),"HTTP/%u.%u %u%[^\n]",&Major,&Minor,
be4401bf 557 &Result,Code) != 4)
db0db9fe 558 return _error->Error(_("The HTTP server sent an invalid reply header"));
be4401bf
AL
559 }
560 else
561 {
562 Major = 0;
563 Minor = 9;
dda7233c 564 if (sscanf(Line.c_str(),"HTTP %u%[^\n]",&Result,Code) != 2)
db0db9fe 565 return _error->Error(_("The HTTP server sent an invalid reply header"));
be4401bf 566 }
e836f356
AL
567
568 /* Check the HTTP response header to get the default persistance
569 state. */
570 if (Major < 1)
571 Persistent = false;
572 else
573 {
574 if (Major == 1 && Minor <= 0)
575 Persistent = false;
576 else
577 Persistent = true;
578 }
b2e465d6 579
be4401bf
AL
580 return true;
581 }
582
92e889c8 583 if (stringcasecmp(Tag,"Content-Length:") == 0)
be4401bf
AL
584 {
585 if (Encoding == Closes)
586 Encoding = Stream;
92e889c8 587 HaveContent = true;
be4401bf
AL
588
589 // The length is already set from the Content-Range header
590 if (StartPos != 0)
591 return true;
592
593 if (sscanf(Val.c_str(),"%lu",&Size) != 1)
db0db9fe 594 return _error->Error(_("The HTTP server sent an invalid Content-Length header"));
be4401bf
AL
595 return true;
596 }
597
92e889c8
AL
598 if (stringcasecmp(Tag,"Content-Type:") == 0)
599 {
600 HaveContent = true;
601 return true;
602 }
603
604 if (stringcasecmp(Tag,"Content-Range:") == 0)
be4401bf 605 {
92e889c8
AL
606 HaveContent = true;
607
be4401bf 608 if (sscanf(Val.c_str(),"bytes %lu-%*u/%lu",&StartPos,&Size) != 2)
db0db9fe 609 return _error->Error(_("The HTTP server sent an invalid Content-Range header"));
be4401bf 610 if ((unsigned)StartPos > Size)
db0db9fe 611 return _error->Error(_("This HTTP server has broken range support"));
be4401bf
AL
612 return true;
613 }
614
92e889c8 615 if (stringcasecmp(Tag,"Transfer-Encoding:") == 0)
be4401bf 616 {
92e889c8
AL
617 HaveContent = true;
618 if (stringcasecmp(Val,"chunked") == 0)
e836f356 619 Encoding = Chunked;
be4401bf
AL
620 return true;
621 }
622
e836f356
AL
623 if (stringcasecmp(Tag,"Connection:") == 0)
624 {
625 if (stringcasecmp(Val,"close") == 0)
626 Persistent = false;
627 if (stringcasecmp(Val,"keep-alive") == 0)
628 Persistent = true;
629 return true;
630 }
631
92e889c8 632 if (stringcasecmp(Tag,"Last-Modified:") == 0)
be4401bf
AL
633 {
634 if (StrToTime(Val,Date) == false)
dc738e7a 635 return _error->Error(_("Unknown date format"));
be4401bf
AL
636 return true;
637 }
638
15d7e515
MV
639 if (stringcasecmp(Tag,"Location:") == 0)
640 {
641 Location = Val;
642 return true;
643 }
644
be4401bf
AL
645 return true;
646}
647 /*}}}*/
648
649// HttpMethod::SendReq - Send the HTTP request /*{{{*/
650// ---------------------------------------------------------------------
651/* This places the http request in the outbound buffer */
652void HttpMethod::SendReq(FetchItem *Itm,CircleBuf &Out)
653{
654 URI Uri = Itm->Uri;
c1a22377 655
be4401bf 656 // The HTTP server expects a hostname with a trailing :port
c1a22377 657 char Buf[1000];
be4401bf
AL
658 string ProperHost = Uri.Host;
659 if (Uri.Port != 0)
660 {
661 sprintf(Buf,":%u",Uri.Port);
662 ProperHost += Buf;
663 }
664
c1a22377
AL
665 // Just in case.
666 if (Itm->Uri.length() >= sizeof(Buf))
667 abort();
668
492f957a
AL
669 /* Build the request. We include a keep-alive header only for non-proxy
670 requests. This is to tweak old http/1.0 servers that do support keep-alive
671 but not HTTP/1.1 automatic keep-alive. Doing this with a proxy server
672 will glitch HTTP/1.0 proxies because they do not filter it out and
673 pass it on, HTTP/1.1 says the connection should default to keep alive
674 and we expect the proxy to do this */
02b7ddb1 675 if (Proxy.empty() == true || Proxy.Host.empty())
be4401bf 676 sprintf(Buf,"GET %s HTTP/1.1\r\nHost: %s\r\nConnection: keep-alive\r\n",
a4edf53b 677 QuoteString(Uri.Path,"~").c_str(),ProperHost.c_str());
be4401bf 678 else
c1a22377
AL
679 {
680 /* Generate a cache control header if necessary. We place a max
681 cache age on index files, optionally set a no-cache directive
682 and a no-store directive for archives. */
be4401bf
AL
683 sprintf(Buf,"GET %s HTTP/1.1\r\nHost: %s\r\n",
684 Itm->Uri.c_str(),ProperHost.c_str());
106e6740
MV
685 // only generate a cache control header if we actually want to
686 // use a cache
687 if (_config->FindB("Acquire::http::No-Cache",false) == false)
c1a22377
AL
688 {
689 if (Itm->IndexFile == true)
690 sprintf(Buf+strlen(Buf),"Cache-Control: max-age=%u\r\n",
bcbe61ae 691 _config->FindI("Acquire::http::Max-Age",0));
c1a22377
AL
692 else
693 {
694 if (_config->FindB("Acquire::http::No-Store",false) == true)
695 strcat(Buf,"Cache-Control: no-store\r\n");
696 }
697 }
698 }
106e6740
MV
699 // generate a no-cache header if needed
700 if (_config->FindB("Acquire::http::No-Cache",false) == true)
701 strcat(Buf,"Cache-Control: no-cache\r\nPragma: no-cache\r\n");
702
c1a22377 703
be4401bf 704 string Req = Buf;
492f957a 705
be4401bf
AL
706 // Check for a partial file
707 struct stat SBuf;
708 if (stat(Itm->DestFile.c_str(),&SBuf) >= 0 && SBuf.st_size > 0)
709 {
710 // In this case we send an if-range query with a range header
1ae93c94 711 sprintf(Buf,"Range: bytes=%li-\r\nIf-Range: %s\r\n",(long)SBuf.st_size - 1,
be4401bf
AL
712 TimeRFC1123(SBuf.st_mtime).c_str());
713 Req += Buf;
714 }
715 else
716 {
717 if (Itm->LastModified != 0)
718 {
719 sprintf(Buf,"If-Modified-Since: %s\r\n",TimeRFC1123(Itm->LastModified).c_str());
720 Req += Buf;
721 }
722 }
723
8d64c395
AL
724 if (Proxy.User.empty() == false || Proxy.Password.empty() == false)
725 Req += string("Proxy-Authorization: Basic ") +
726 Base64Encode(Proxy.User + ":" + Proxy.Password) + "\r\n";
be4401bf 727
1de1f703 728 maybe_add_auth (Uri, _config->FindFile("Dir::Etc::netrc"));
b2e465d6 729 if (Uri.User.empty() == false || Uri.Password.empty() == false)
592b7800 730 {
b2e465d6
AL
731 Req += string("Authorization: Basic ") +
732 Base64Encode(Uri.User + ":" + Uri.Password) + "\r\n";
592b7800 733 }
4494239c
DK
734 Req += "User-Agent: " + _config->Find("Acquire::http::User-Agent",
735 "Debian APT-HTTP/1.3 ("VERSION")") + "\r\n\r\n";
c98b1307
AL
736
737 if (Debug == true)
738 cerr << Req << endl;
c1a22377 739
be4401bf
AL
740 Out.Read(Req);
741}
742 /*}}}*/
743// HttpMethod::Go - Run a single loop /*{{{*/
744// ---------------------------------------------------------------------
745/* This runs the select loop over the server FDs, Output file FDs and
746 stdin. */
747bool HttpMethod::Go(bool ToFile,ServerState *Srv)
748{
749 // Server has closed the connection
8195ae46
AL
750 if (Srv->ServerFd == -1 && (Srv->In.WriteSpace() == false ||
751 ToFile == false))
be4401bf
AL
752 return false;
753
d955fe80 754 fd_set rfds,wfds;
be4401bf
AL
755 FD_ZERO(&rfds);
756 FD_ZERO(&wfds);
be4401bf 757
e836f356
AL
758 /* Add the server. We only send more requests if the connection will
759 be persisting */
760 if (Srv->Out.WriteSpace() == true && Srv->ServerFd != -1
761 && Srv->Persistent == true)
be4401bf 762 FD_SET(Srv->ServerFd,&wfds);
e836f356 763 if (Srv->In.ReadSpace() == true && Srv->ServerFd != -1)
be4401bf
AL
764 FD_SET(Srv->ServerFd,&rfds);
765
766 // Add the file
767 int FileFD = -1;
768 if (File != 0)
769 FileFD = File->Fd();
770
771 if (Srv->In.WriteSpace() == true && ToFile == true && FileFD != -1)
772 FD_SET(FileFD,&wfds);
773
774 // Add stdin
775 FD_SET(STDIN_FILENO,&rfds);
776
be4401bf
AL
777 // Figure out the max fd
778 int MaxFd = FileFD;
779 if (MaxFd < Srv->ServerFd)
780 MaxFd = Srv->ServerFd;
8195ae46 781
be4401bf
AL
782 // Select
783 struct timeval tv;
3000ccea 784 tv.tv_sec = TimeOut;
be4401bf
AL
785 tv.tv_usec = 0;
786 int Res = 0;
d955fe80 787 if ((Res = select(MaxFd+1,&rfds,&wfds,0,&tv)) < 0)
c37b9502
AL
788 {
789 if (errno == EINTR)
790 return true;
dc738e7a 791 return _error->Errno("select",_("Select failed"));
c37b9502 792 }
be4401bf
AL
793
794 if (Res == 0)
795 {
dc738e7a 796 _error->Error(_("Connection timed out"));
be4401bf
AL
797 return ServerDie(Srv);
798 }
799
be4401bf
AL
800 // Handle server IO
801 if (Srv->ServerFd != -1 && FD_ISSET(Srv->ServerFd,&rfds))
802 {
803 errno = 0;
804 if (Srv->In.Read(Srv->ServerFd) == false)
805 return ServerDie(Srv);
806 }
807
808 if (Srv->ServerFd != -1 && FD_ISSET(Srv->ServerFd,&wfds))
809 {
810 errno = 0;
811 if (Srv->Out.Write(Srv->ServerFd) == false)
812 return ServerDie(Srv);
813 }
814
815 // Send data to the file
816 if (FileFD != -1 && FD_ISSET(FileFD,&wfds))
817 {
818 if (Srv->In.Write(FileFD) == false)
dc738e7a 819 return _error->Errno("write",_("Error writing to output file"));
be4401bf
AL
820 }
821
822 // Handle commands from APT
823 if (FD_ISSET(STDIN_FILENO,&rfds))
824 {
6920216d 825 if (Run(true) != -1)
be4401bf
AL
826 exit(100);
827 }
828
829 return true;
830}
831 /*}}}*/
832// HttpMethod::Flush - Dump the buffer into the file /*{{{*/
833// ---------------------------------------------------------------------
834/* This takes the current input buffer from the Server FD and writes it
835 into the file */
836bool HttpMethod::Flush(ServerState *Srv)
837{
838 if (File != 0)
839 {
b57c8bb4
MV
840 // on GNU/kFreeBSD, apt dies on /dev/null because non-blocking
841 // can't be set
842 if (File->Name() != "/dev/null")
843 SetNonBlock(File->Fd(),false);
be4401bf
AL
844 if (Srv->In.WriteSpace() == false)
845 return true;
846
847 while (Srv->In.WriteSpace() == true)
848 {
849 if (Srv->In.Write(File->Fd()) == false)
dc738e7a 850 return _error->Errno("write",_("Error writing to file"));
92e889c8
AL
851 if (Srv->In.IsLimit() == true)
852 return true;
be4401bf
AL
853 }
854
855 if (Srv->In.IsLimit() == true || Srv->Encoding == ServerState::Closes)
856 return true;
857 }
858 return false;
859}
860 /*}}}*/
861// HttpMethod::ServerDie - The server has closed the connection. /*{{{*/
862// ---------------------------------------------------------------------
863/* */
864bool HttpMethod::ServerDie(ServerState *Srv)
865{
2b154e53
AL
866 unsigned int LErrno = errno;
867
be4401bf
AL
868 // Dump the buffer to the file
869 if (Srv->State == ServerState::Data)
870 {
b57c8bb4
MV
871 // on GNU/kFreeBSD, apt dies on /dev/null because non-blocking
872 // can't be set
873 if (File->Name() != "/dev/null")
874 SetNonBlock(File->Fd(),false);
be4401bf
AL
875 while (Srv->In.WriteSpace() == true)
876 {
877 if (Srv->In.Write(File->Fd()) == false)
dc738e7a 878 return _error->Errno("write",_("Error writing to the file"));
92e889c8
AL
879
880 // Done
881 if (Srv->In.IsLimit() == true)
882 return true;
be4401bf
AL
883 }
884 }
885
886 // See if this is because the server finished the data stream
887 if (Srv->In.IsLimit() == false && Srv->State != ServerState::Header &&
888 Srv->Encoding != ServerState::Closes)
889 {
3d615484 890 Srv->Close();
2b154e53 891 if (LErrno == 0)
db0db9fe 892 return _error->Error(_("Error reading from server. Remote end closed connection"));
2b154e53 893 errno = LErrno;
dc738e7a 894 return _error->Errno("read",_("Error reading from server"));
be4401bf
AL
895 }
896 else
897 {
898 Srv->In.Limit(-1);
899
900 // Nothing left in the buffer
901 if (Srv->In.WriteSpace() == false)
902 return false;
903
904 // We may have got multiple responses back in one packet..
905 Srv->Close();
906 return true;
907 }
908
909 return false;
910}
911 /*}}}*/
912// HttpMethod::DealWithHeaders - Handle the retrieved header data /*{{{*/
913// ---------------------------------------------------------------------
914/* We look at the header data we got back from the server and decide what
915 to do. Returns
916 0 - File is open,
917 1 - IMS hit
92e889c8 918 3 - Unrecoverable error
94235cfb 919 4 - Error with error content page
15d7e515
MV
920 5 - Unrecoverable non-server error (close the connection)
921 6 - Try again with a new or changed URI
922 */
be4401bf
AL
923int HttpMethod::DealWithHeaders(FetchResult &Res,ServerState *Srv)
924{
925 // Not Modified
926 if (Srv->Result == 304)
927 {
928 unlink(Queue->DestFile.c_str());
929 Res.IMSHit = true;
930 Res.LastModified = Queue->LastModified;
931 return 1;
932 }
933
15d7e515
MV
934 /* Redirect
935 *
936 * Note that it is only OK for us to treat all redirection the same
937 * because we *always* use GET, not other HTTP methods. There are
938 * three redirection codes for which it is not appropriate that we
939 * redirect. Pass on those codes so the error handling kicks in.
940 */
941 if (AllowRedirect
942 && (Srv->Result > 300 && Srv->Result < 400)
943 && (Srv->Result != 300 // Multiple Choices
944 && Srv->Result != 304 // Not Modified
945 && Srv->Result != 306)) // (Not part of HTTP/1.1, reserved)
946 {
947 if (!Srv->Location.empty())
948 {
949 NextURI = Srv->Location;
950 return 6;
951 }
952 /* else pass through for error message */
953 }
954
be4401bf
AL
955 /* We have a reply we dont handle. This should indicate a perm server
956 failure */
957 if (Srv->Result < 200 || Srv->Result >= 300)
958 {
959 _error->Error("%u %s",Srv->Result,Srv->Code);
92e889c8
AL
960 if (Srv->HaveContent == true)
961 return 4;
be4401bf
AL
962 return 3;
963 }
964
965 // This is some sort of 2xx 'data follows' reply
966 Res.LastModified = Srv->Date;
967 Res.Size = Srv->Size;
968
969 // Open the file
970 delete File;
971 File = new FileFd(Queue->DestFile,FileFd::WriteAny);
972 if (_error->PendingError() == true)
94235cfb 973 return 5;
492f957a
AL
974
975 FailFile = Queue->DestFile;
30b30ec1 976 FailFile.c_str(); // Make sure we dont do a malloc in the signal handler
492f957a
AL
977 FailFd = File->Fd();
978 FailTime = Srv->Date;
979
be4401bf
AL
980 // Set the expected size
981 if (Srv->StartPos >= 0)
982 {
983 Res.ResumePoint = Srv->StartPos;
9b5d79ec
MV
984 if (ftruncate(File->Fd(),Srv->StartPos) < 0)
985 _error->Errno("ftruncate", _("Failed to truncate file"));
be4401bf
AL
986 }
987
988 // Set the start point
989 lseek(File->Fd(),0,SEEK_END);
990
63b1700f
AL
991 delete Srv->In.Hash;
992 Srv->In.Hash = new Hashes;
be4401bf 993
63b1700f 994 // Fill the Hash if the file is non-empty (resume)
be4401bf
AL
995 if (Srv->StartPos > 0)
996 {
997 lseek(File->Fd(),0,SEEK_SET);
63b1700f 998 if (Srv->In.Hash->AddFD(File->Fd(),Srv->StartPos) == false)
be4401bf 999 {
dc738e7a 1000 _error->Errno("read",_("Problem hashing file"));
94235cfb 1001 return 5;
be4401bf
AL
1002 }
1003 lseek(File->Fd(),0,SEEK_END);
1004 }
1005
1006 SetNonBlock(File->Fd(),true);
1007 return 0;
1008}
1009 /*}}}*/
492f957a
AL
1010// HttpMethod::SigTerm - Handle a fatal signal /*{{{*/
1011// ---------------------------------------------------------------------
1012/* This closes and timestamps the open file. This is necessary to get
1013 resume behavior on user abort */
1014void HttpMethod::SigTerm(int)
1015{
1016 if (FailFd == -1)
ffe9323a 1017 _exit(100);
492f957a
AL
1018 close(FailFd);
1019
1020 // Timestamp
1021 struct utimbuf UBuf;
492f957a
AL
1022 UBuf.actime = FailTime;
1023 UBuf.modtime = FailTime;
1024 utime(FailFile.c_str(),&UBuf);
1025
ffe9323a 1026 _exit(100);
492f957a
AL
1027}
1028 /*}}}*/
5cb5d8dc
AL
1029// HttpMethod::Fetch - Fetch an item /*{{{*/
1030// ---------------------------------------------------------------------
1031/* This adds an item to the pipeline. We keep the pipeline at a fixed
1032 depth. */
1033bool HttpMethod::Fetch(FetchItem *)
1034{
1035 if (Server == 0)
1036 return true;
3000ccea 1037
5cb5d8dc
AL
1038 // Queue the requests
1039 int Depth = -1;
f93d1355
AL
1040 for (FetchItem *I = Queue; I != 0 && Depth < (signed)PipelineDepth;
1041 I = I->Next, Depth++)
5cb5d8dc 1042 {
f93d1355
AL
1043 // If pipelining is disabled, we only queue 1 request
1044 if (Server->Pipeline == false && Depth >= 0)
1045 break;
1046
5cb5d8dc
AL
1047 // Make sure we stick with the same server
1048 if (Server->Comp(I->Uri) == false)
1049 break;
5cb5d8dc 1050 if (QueueBack == I)
5cb5d8dc 1051 {
5cb5d8dc
AL
1052 QueueBack = I->Next;
1053 SendReq(I,Server->Out);
1054 continue;
f93d1355 1055 }
5cb5d8dc
AL
1056 }
1057
1058 return true;
1059};
1060 /*}}}*/
85f72a56
AL
1061// HttpMethod::Configuration - Handle a configuration message /*{{{*/
1062// ---------------------------------------------------------------------
1063/* We stash the desired pipeline depth */
1064bool HttpMethod::Configuration(string Message)
1065{
1066 if (pkgAcqMethod::Configuration(Message) == false)
1067 return false;
1068
15d7e515 1069 AllowRedirect = _config->FindB("Acquire::http::AllowRedirect",true);
30456e14
AL
1070 TimeOut = _config->FindI("Acquire::http::Timeout",TimeOut);
1071 PipelineDepth = _config->FindI("Acquire::http::Pipeline-Depth",
1072 PipelineDepth);
c98b1307 1073 Debug = _config->FindB("Debug::Acquire::http",false);
3000ccea 1074
85f72a56
AL
1075 return true;
1076}
1077 /*}}}*/
492f957a 1078// HttpMethod::Loop - Main loop /*{{{*/
be4401bf
AL
1079// ---------------------------------------------------------------------
1080/* */
1081int HttpMethod::Loop()
1082{
15d7e515
MV
1083 typedef vector<string> StringVector;
1084 typedef vector<string>::iterator StringVectorIterator;
1085 map<string, StringVector> Redirected;
1086
492f957a
AL
1087 signal(SIGTERM,SigTerm);
1088 signal(SIGINT,SigTerm);
1089
5cb5d8dc 1090 Server = 0;
be4401bf 1091
92e889c8 1092 int FailCounter = 0;
be4401bf 1093 while (1)
2b154e53 1094 {
be4401bf
AL
1095 // We have no commands, wait for some to arrive
1096 if (Queue == 0)
1097 {
1098 if (WaitFd(STDIN_FILENO) == false)
1099 return 0;
1100 }
1101
6920216d
AL
1102 /* Run messages, we can accept 0 (no message) if we didn't
1103 do a WaitFd above.. Otherwise the FD is closed. */
1104 int Result = Run(true);
1105 if (Result != -1 && (Result != 0 || Queue == 0))
be4401bf
AL
1106 return 100;
1107
1108 if (Queue == 0)
1109 continue;
1110
1111 // Connect to the server
1112 if (Server == 0 || Server->Comp(Queue->Uri) == false)
1113 {
1114 delete Server;
1115 Server = new ServerState(Queue->Uri,this);
1116 }
e836f356
AL
1117 /* If the server has explicitly said this is the last connection
1118 then we pre-emptively shut down the pipeline and tear down
1119 the connection. This will speed up HTTP/1.0 servers a tad
1120 since we don't have to wait for the close sequence to
1121 complete */
1122 if (Server->Persistent == false)
1123 Server->Close();
1124
a7fb252c
AL
1125 // Reset the pipeline
1126 if (Server->ServerFd == -1)
1127 QueueBack = Queue;
1128
be4401bf
AL
1129 // Connnect to the host
1130 if (Server->Open() == false)
1131 {
43252d15 1132 Fail(true);
a1459f52
AL
1133 delete Server;
1134 Server = 0;
be4401bf
AL
1135 continue;
1136 }
be4401bf 1137
5cb5d8dc
AL
1138 // Fill the pipeline.
1139 Fetch(0);
1140
92e889c8
AL
1141 // Fetch the next URL header data from the server.
1142 switch (Server->RunHeaders())
be4401bf 1143 {
92e889c8
AL
1144 case 0:
1145 break;
1146
1147 // The header data is bad
1148 case 2:
1149 {
db0db9fe 1150 _error->Error(_("Bad header data"));
43252d15 1151 Fail(true);
b2e465d6 1152 RotateDNS();
92e889c8
AL
1153 continue;
1154 }
1155
1156 // The server closed a connection during the header get..
1157 default:
1158 case 1:
1159 {
1160 FailCounter++;
3d615484 1161 _error->Discard();
92e889c8 1162 Server->Close();
f93d1355
AL
1163 Server->Pipeline = false;
1164
2b154e53
AL
1165 if (FailCounter >= 2)
1166 {
dc738e7a 1167 Fail(_("Connection failed"),true);
2b154e53
AL
1168 FailCounter = 0;
1169 }
1170
b2e465d6 1171 RotateDNS();
92e889c8
AL
1172 continue;
1173 }
1174 };
5cb5d8dc 1175
be4401bf
AL
1176 // Decide what to do.
1177 FetchResult Res;
bfd22fc0 1178 Res.Filename = Queue->DestFile;
be4401bf
AL
1179 switch (DealWithHeaders(Res,Server))
1180 {
1181 // Ok, the file is Open
1182 case 0:
1183 {
1184 URIStart(Res);
1185
1186 // Run the data
492f957a
AL
1187 bool Result = Server->RunData();
1188
b2e465d6
AL
1189 /* If the server is sending back sizeless responses then fill in
1190 the size now */
1191 if (Res.Size == 0)
1192 Res.Size = File->Size();
1193
492f957a
AL
1194 // Close the file, destroy the FD object and timestamp it
1195 FailFd = -1;
1196 delete File;
1197 File = 0;
1198
1199 // Timestamp
1200 struct utimbuf UBuf;
1201 time(&UBuf.actime);
1202 UBuf.actime = Server->Date;
1203 UBuf.modtime = Server->Date;
1204 utime(Queue->DestFile.c_str(),&UBuf);
1205
1206 // Send status to APT
1207 if (Result == true)
92e889c8 1208 {
a7c835af 1209 Res.TakeHashes(*Server->In.Hash);
92e889c8
AL
1210 URIDone(Res);
1211 }
492f957a 1212 else
82d0afc2
MV
1213 {
1214 if (Server->ServerFd == -1)
1215 {
1216 FailCounter++;
1217 _error->Discard();
1218 Server->Close();
1219
1220 if (FailCounter >= 2)
9a52beaa 1221 {
82d0afc2
MV
1222 Fail(_("Connection failed"),true);
1223 FailCounter = 0;
9a52beaa 1224 }
82d0afc2
MV
1225
1226 QueueBack = Queue;
1227 }
1228 else
1229 Fail(true);
1230 }
be4401bf
AL
1231 break;
1232 }
1233
1234 // IMS hit
1235 case 1:
1236 {
1237 URIDone(Res);
1238 break;
1239 }
1240
1241 // Hard server error, not found or something
1242 case 3:
1243 {
1244 Fail();
1245 break;
1246 }
94235cfb
AL
1247
1248 // Hard internal error, kill the connection and fail
1249 case 5:
1250 {
a305f593
AL
1251 delete File;
1252 File = 0;
1253
94235cfb 1254 Fail();
b2e465d6 1255 RotateDNS();
94235cfb
AL
1256 Server->Close();
1257 break;
1258 }
92e889c8
AL
1259
1260 // We need to flush the data, the header is like a 404 w/ error text
1261 case 4:
1262 {
1263 Fail();
1264
1265 // Send to content to dev/null
1266 File = new FileFd("/dev/null",FileFd::WriteExists);
1267 Server->RunData();
1268 delete File;
1269 File = 0;
1270 break;
1271 }
be4401bf 1272
15d7e515
MV
1273 // Try again with a new URL
1274 case 6:
1275 {
1276 // Clear rest of response if there is content
1277 if (Server->HaveContent)
1278 {
1279 File = new FileFd("/dev/null",FileFd::WriteExists);
1280 Server->RunData();
1281 delete File;
1282 File = 0;
1283 }
1284
1285 /* Detect redirect loops. No more redirects are allowed
1286 after the same URI is seen twice in a queue item. */
1287 StringVector &R = Redirected[Queue->DestFile];
1288 bool StopRedirects = false;
1289 if (R.size() == 0)
1290 R.push_back(Queue->Uri);
1291 else if (R[0] == "STOP" || R.size() > 10)
1292 StopRedirects = true;
1293 else
1294 {
1295 for (StringVectorIterator I = R.begin(); I != R.end(); I++)
1296 if (Queue->Uri == *I)
1297 {
1298 R[0] = "STOP";
1299 break;
1300 }
1301
1302 R.push_back(Queue->Uri);
1303 }
1304
1305 if (StopRedirects == false)
1306 Redirect(NextURI);
1307 else
1308 Fail();
1309
1310 break;
1311 }
1312
be4401bf 1313 default:
dc738e7a 1314 Fail(_("Internal error"));
be4401bf 1315 break;
92e889c8
AL
1316 }
1317
1318 FailCounter = 0;
be4401bf
AL
1319 }
1320
1321 return 0;
1322}
1323 /*}}}*/
1324
1325int main()
1326{
049c0171 1327 setlocale(LC_ALL, "");
ab7f4d7c
MV
1328 // ignore SIGPIPE, this can happen on write() if the socket
1329 // closes the connection (this is dealt with via ServerDie())
1330 signal(SIGPIPE, SIG_IGN);
049c0171 1331
be4401bf 1332 HttpMethod Mth;
be4401bf
AL
1333 return Mth.Loop();
1334}
a305f593
AL
1335
1336