]>
git.saurik.com Git - apt.git/blob - methods/http.cc
1 // -*- mode: cpp; mode: fold -*-
3 // $Id: http.cc,v 1.59 2004/05/08 19:42:35 mdz Exp $
4 /* ######################################################################
6 HTTP Acquire Method - This is the HTTP acquire method for APT.
8 It uses HTTP/1.1 and many of the fancy options there-in, such as
9 pipelining, range, if-range and so on.
11 It is based on a doubly buffered select loop. A group of requests is
12 fed into a single output buffer that is constantly fed out the
13 socket. This provides ideal pipelining as in many cases all of the
14 requests will fit into a single packet. The input socket is buffered
15 the same way and fed into the fd for the file (may be a pipe in future).
17 This double buffering provides fairly substantial transfer rates,
18 compared to wget the http method is about 4% faster. Most importantly,
19 when HTTP is compared with FTP as a protocol the speed difference is
20 huge. In tests over the internet from two sites to llug (via ATM) this
21 program got 230k/s sustained http transfer rates. FTP on the other
22 hand topped out at 170k/s. That combined with the time to setup the
23 FTP connection makes HTTP a vastly superior protocol.
25 ##################################################################### */
27 // Include Files /*{{{*/
30 #include <apt-pkg/fileutl.h>
31 #include <apt-pkg/configuration.h>
32 #include <apt-pkg/error.h>
33 #include <apt-pkg/hashes.h>
34 #include <apt-pkg/netrc.h>
35 #include <apt-pkg/strutl.h>
36 #include <apt-pkg/proxy.h>
40 #include <sys/select.h>
58 unsigned long long CircleBuf::BwReadLimit
=0;
59 unsigned long long CircleBuf::BwTickReadData
=0;
60 struct timeval
CircleBuf::BwReadTick
={0,0};
61 const unsigned int CircleBuf::BW_HZ
=10;
63 // CircleBuf::CircleBuf - Circular input buffer /*{{{*/
64 // ---------------------------------------------------------------------
66 CircleBuf::CircleBuf(unsigned long long Size
)
67 : Size(Size
), Hash(NULL
), TotalWriten(0)
69 Buf
= new unsigned char[Size
];
72 CircleBuf::BwReadLimit
= _config
->FindI("Acquire::http::Dl-Limit",0)*1024;
75 // CircleBuf::Reset - Reset to the default state /*{{{*/
76 // ---------------------------------------------------------------------
78 void CircleBuf::Reset()
84 MaxGet
= (unsigned long long)-1;
93 // CircleBuf::Read - Read from a FD into the circular buffer /*{{{*/
94 // ---------------------------------------------------------------------
95 /* This fills up the buffer with as much data as is in the FD, assuming it
97 bool CircleBuf::Read(int Fd
)
101 // Woops, buffer is full
102 if (InP
- OutP
== Size
)
105 // what's left to read in this tick
106 unsigned long long const BwReadMax
= CircleBuf::BwReadLimit
/BW_HZ
;
108 if(CircleBuf::BwReadLimit
) {
110 gettimeofday(&now
,0);
112 unsigned long long d
= (now
.tv_sec
-CircleBuf::BwReadTick
.tv_sec
)*1000000 +
113 now
.tv_usec
-CircleBuf::BwReadTick
.tv_usec
;
114 if(d
> 1000000/BW_HZ
) {
115 CircleBuf::BwReadTick
= now
;
116 CircleBuf::BwTickReadData
= 0;
119 if(CircleBuf::BwTickReadData
>= BwReadMax
) {
120 usleep(1000000/BW_HZ
);
125 // Read from the FD into the buffer segment
127 if(CircleBuf::BwReadLimit
) {
128 Res
= read(Fd
,Buf
+ (InP%Size
),
129 BwReadMax
> LeftRead() ? LeftRead() : BwReadMax
);
131 Res
= read(Fd
,Buf
+ (InP%Size
),LeftRead());
133 if(Res
> 0 && BwReadLimit
> 0)
134 CircleBuf::BwTickReadData
+= Res
;
146 gettimeofday(&Start
,0);
151 // CircleBuf::Read - Put the string into the buffer /*{{{*/
152 // ---------------------------------------------------------------------
153 /* This will hold the string in and fill the buffer with it as it empties */
154 bool CircleBuf::Read(string Data
)
161 // CircleBuf::FillOut - Fill the buffer from the output queue /*{{{*/
162 // ---------------------------------------------------------------------
164 void CircleBuf::FillOut()
166 if (OutQueue
.empty() == true)
170 // Woops, buffer is full
171 if (InP
- OutP
== Size
)
174 // Write the buffer segment
175 unsigned long long Sz
= LeftRead();
176 if (OutQueue
.length() - StrPos
< Sz
)
177 Sz
= OutQueue
.length() - StrPos
;
178 memcpy(Buf
+ (InP%Size
),OutQueue
.c_str() + StrPos
,Sz
);
183 if (OutQueue
.length() == StrPos
)
192 // CircleBuf::Write - Write from the buffer into a FD /*{{{*/
193 // ---------------------------------------------------------------------
194 /* This empties the buffer into the FD. */
195 bool CircleBuf::Write(int Fd
)
201 // Woops, buffer is empty
208 // Write the buffer segment
210 Res
= write(Fd
,Buf
+ (OutP%Size
),LeftWrite());
225 Hash
->Add(Buf
+ (OutP%Size
),Res
);
231 // CircleBuf::WriteTillEl - Write from the buffer to a string /*{{{*/
232 // ---------------------------------------------------------------------
233 /* This copies till the first empty line */
234 bool CircleBuf::WriteTillEl(string
&Data
,bool Single
)
236 // We cheat and assume it is unneeded to have more than one buffer load
237 for (unsigned long long I
= OutP
; I
< InP
; I
++)
239 if (Buf
[I%Size
] != '\n')
245 if (I
< InP
&& Buf
[I%Size
] == '\r')
247 if (I
>= InP
|| Buf
[I%Size
] != '\n')
255 unsigned long long Sz
= LeftWrite();
260 Data
+= string((char *)(Buf
+ (OutP%Size
)),Sz
);
268 // CircleBuf::Stats - Print out stats information /*{{{*/
269 // ---------------------------------------------------------------------
271 void CircleBuf::Stats()
277 gettimeofday(&Stop
,0);
278 /* float Diff = Stop.tv_sec - Start.tv_sec +
279 (float)(Stop.tv_usec - Start.tv_usec)/1000000;
280 clog << "Got " << InP << " in " << Diff << " at " << InP/Diff << endl;*/
283 CircleBuf::~CircleBuf()
289 // HttpServerState::HttpServerState - Constructor /*{{{*/
290 HttpServerState::HttpServerState(URI Srv
,HttpMethod
*Owner
) : ServerState(Srv
, Owner
), In(64*1024), Out(4*1024)
292 TimeOut
= _config
->FindI("Acquire::http::Timeout",TimeOut
);
296 // HttpServerState::Open - Open a connection to the server /*{{{*/
297 // ---------------------------------------------------------------------
298 /* This opens a connection to the server. */
299 bool HttpServerState::Open()
301 // Use the already open connection if possible.
310 // Determine the proxy setting
311 AutoDetectProxy(ServerName
);
312 string SpecificProxy
= _config
->Find("Acquire::http::Proxy::" + ServerName
.Host
);
313 if (!SpecificProxy
.empty())
315 if (SpecificProxy
== "DIRECT")
318 Proxy
= SpecificProxy
;
322 string DefProxy
= _config
->Find("Acquire::http::Proxy");
323 if (!DefProxy
.empty())
329 char* result
= getenv("http_proxy");
330 Proxy
= result
? result
: "";
334 // Parse no_proxy, a , separated list of domains
335 if (getenv("no_proxy") != 0)
337 if (CheckDomainList(ServerName
.Host
,getenv("no_proxy")) == true)
341 // Determine what host and port to use based on the proxy settings
344 if (Proxy
.empty() == true || Proxy
.Host
.empty() == true)
346 if (ServerName
.Port
!= 0)
347 Port
= ServerName
.Port
;
348 Host
= ServerName
.Host
;
350 else if (Proxy
.Access
!= "http")
351 return _error
->Error("Unsupported proxy configured: %s", URI::SiteOnly(Proxy
).c_str());
359 // Connect to the remote server
360 if (Connect(Host
,Port
,"http",80,ServerFd
,TimeOut
,Owner
) == false)
366 // HttpServerState::Close - Close a connection to the server /*{{{*/
367 // ---------------------------------------------------------------------
369 bool HttpServerState::Close()
376 // HttpServerState::RunData - Transfer the data from the socket /*{{{*/
377 bool HttpServerState::RunData(FileFd
* const File
)
381 // Chunked transfer encoding is fun..
382 if (Encoding
== Chunked
)
386 // Grab the block size
392 if (In
.WriteTillEl(Data
,true) == true)
395 while ((Last
= Go(false, File
)) == true);
400 // See if we are done
401 unsigned long long Len
= strtoull(Data
.c_str(),0,16);
406 // We have to remove the entity trailer
410 if (In
.WriteTillEl(Data
,true) == true && Data
.length() <= 2)
413 while ((Last
= Go(false, File
)) == true);
416 return !_error
->PendingError();
419 // Transfer the block
421 while (Go(true, File
) == true)
422 if (In
.IsLimit() == true)
426 if (In
.IsLimit() == false)
429 // The server sends an extra new line before the next block specifier..
434 if (In
.WriteTillEl(Data
,true) == true)
437 while ((Last
= Go(false, File
)) == true);
444 /* Closes encoding is used when the server did not specify a size, the
445 loss of the connection means we are done */
448 else if (DownloadSize
!= 0)
449 In
.Limit(DownloadSize
);
450 else if (Persistent
== false)
453 // Just transfer the whole block.
456 if (In
.IsLimit() == false)
460 return !_error
->PendingError();
462 while (Go(true, File
) == true);
465 return Owner
->Flush() && !_error
->PendingError();
468 bool HttpServerState::RunDataToDevNull() /*{{{*/
470 FileFd
DevNull("/dev/null", FileFd::WriteOnly
);
471 return RunData(&DevNull
);
474 bool HttpServerState::ReadHeaderLines(std::string
&Data
) /*{{{*/
476 return In
.WriteTillEl(Data
);
479 bool HttpServerState::LoadNextResponse(bool const ToFile
, FileFd
* const File
)/*{{{*/
481 return Go(ToFile
, File
);
484 bool HttpServerState::WriteResponse(const std::string
&Data
) /*{{{*/
486 return Out
.Read(Data
);
489 APT_PURE
bool HttpServerState::IsOpen() /*{{{*/
491 return (ServerFd
!= -1);
494 bool HttpServerState::InitHashes(HashStringList
const &ExpectedHashes
) /*{{{*/
497 In
.Hash
= new Hashes(ExpectedHashes
);
502 APT_PURE Hashes
* HttpServerState::GetHashes() /*{{{*/
507 // HttpServerState::Die - The server has closed the connection. /*{{{*/
508 bool HttpServerState::Die(FileFd
* const File
)
510 unsigned int LErrno
= errno
;
512 // Dump the buffer to the file
513 if (State
== ServerState::Data
)
517 // on GNU/kFreeBSD, apt dies on /dev/null because non-blocking
519 if (File
->Name() != "/dev/null")
520 SetNonBlock(File
->Fd(),false);
521 while (In
.WriteSpace() == true)
523 if (In
.Write(File
->Fd()) == false)
524 return _error
->Errno("write",_("Error writing to the file"));
527 if (In
.IsLimit() == true)
532 // See if this is because the server finished the data stream
533 if (In
.IsLimit() == false && State
!= HttpServerState::Header
&&
538 return _error
->Error(_("Error reading from server. Remote end closed connection"));
540 return _error
->Errno("read",_("Error reading from server"));
546 // Nothing left in the buffer
547 if (In
.WriteSpace() == false)
550 // We may have got multiple responses back in one packet..
558 // HttpServerState::Flush - Dump the buffer into the file /*{{{*/
559 // ---------------------------------------------------------------------
560 /* This takes the current input buffer from the Server FD and writes it
562 bool HttpServerState::Flush(FileFd
* const File
)
566 // on GNU/kFreeBSD, apt dies on /dev/null because non-blocking
568 if (File
->Name() != "/dev/null")
569 SetNonBlock(File
->Fd(),false);
570 if (In
.WriteSpace() == false)
573 while (In
.WriteSpace() == true)
575 if (In
.Write(File
->Fd()) == false)
576 return _error
->Errno("write",_("Error writing to file"));
577 if (In
.IsLimit() == true)
581 if (In
.IsLimit() == true || Persistent
== false)
587 // HttpServerState::Go - Run a single loop /*{{{*/
588 // ---------------------------------------------------------------------
589 /* This runs the select loop over the server FDs, Output file FDs and
591 bool HttpServerState::Go(bool ToFile
, FileFd
* const File
)
593 // Server has closed the connection
594 if (ServerFd
== -1 && (In
.WriteSpace() == false ||
602 /* Add the server. We only send more requests if the connection will
604 if (Out
.WriteSpace() == true && ServerFd
!= -1
605 && Persistent
== true)
606 FD_SET(ServerFd
,&wfds
);
607 if (In
.ReadSpace() == true && ServerFd
!= -1)
608 FD_SET(ServerFd
,&rfds
);
615 if (In
.WriteSpace() == true && ToFile
== true && FileFD
!= -1)
616 FD_SET(FileFD
,&wfds
);
619 if (_config
->FindB("Acquire::http::DependOnSTDIN", true) == true)
620 FD_SET(STDIN_FILENO
,&rfds
);
622 // Figure out the max fd
624 if (MaxFd
< ServerFd
)
632 if ((Res
= select(MaxFd
+1,&rfds
,&wfds
,0,&tv
)) < 0)
636 return _error
->Errno("select",_("Select failed"));
641 _error
->Error(_("Connection timed out"));
646 if (ServerFd
!= -1 && FD_ISSET(ServerFd
,&rfds
))
649 if (In
.Read(ServerFd
) == false)
653 if (ServerFd
!= -1 && FD_ISSET(ServerFd
,&wfds
))
656 if (Out
.Write(ServerFd
) == false)
660 // Send data to the file
661 if (FileFD
!= -1 && FD_ISSET(FileFD
,&wfds
))
663 if (In
.Write(FileFD
) == false)
664 return _error
->Errno("write",_("Error writing to output file"));
667 if (MaximumSize
> 0 && File
&& File
->Tell() > MaximumSize
)
669 Owner
->SetFailReason("MaximumSizeExceeded");
670 return _error
->Error("Writing more data than expected (%llu > %llu)",
671 File
->Tell(), MaximumSize
);
674 // Handle commands from APT
675 if (FD_ISSET(STDIN_FILENO
,&rfds
))
677 if (Owner
->Run(true) != -1)
685 // HttpMethod::SendReq - Send the HTTP request /*{{{*/
686 // ---------------------------------------------------------------------
687 /* This places the http request in the outbound buffer */
688 void HttpMethod::SendReq(FetchItem
*Itm
)
692 // The HTTP server expects a hostname with a trailing :port
693 std::stringstream Req
;
696 if (Uri
.Host
.find(':') != string::npos
)
697 ProperHost
= '[' + Uri
.Host
+ ']';
699 ProperHost
= Uri
.Host
;
701 /* RFC 2616 §5.1.2 requires absolute URIs for requests to proxies,
702 but while it's a must for all servers to accept absolute URIs,
703 it is assumed clients will send an absolute path for non-proxies */
704 std::string requesturi
;
705 if (Server
->Proxy
.empty() == true || Server
->Proxy
.Host
.empty())
706 requesturi
= Uri
.Path
;
708 requesturi
= Itm
->Uri
;
710 // The "+" is encoded as a workaround for an Amazon S3 bug
711 // see LP bugs #1003633 and #1086997.
712 requesturi
= QuoteString(requesturi
, "+~ ");
714 /* Build the request. No keep-alive is included as it is the default
715 in 1.1, can cause problems with proxies, and we are an HTTP/1.1
717 C.f. https://tools.ietf.org/wg/httpbis/trac/ticket/158 */
718 Req
<< "GET " << requesturi
<< " HTTP/1.1\r\n";
720 Req
<< "Host: " << ProperHost
<< ":" << std::to_string(Uri
.Port
) << "\r\n";
722 Req
<< "Host: " << ProperHost
<< "\r\n";
724 // generate a cache control header (if needed)
725 if (_config
->FindB("Acquire::http::No-Cache",false) == true)
726 Req
<< "Cache-Control: no-cache\r\n"
727 << "Pragma: no-cache\r\n";
728 else if (Itm
->IndexFile
== true)
729 Req
<< "Cache-Control: max-age=" << std::to_string(_config
->FindI("Acquire::http::Max-Age",0)) << "\r\n";
730 else if (_config
->FindB("Acquire::http::No-Store",false) == true)
731 Req
<< "Cache-Control: no-store\r\n";
733 // If we ask for uncompressed files servers might respond with content-
734 // negotiation which lets us end up with compressed files we do not support,
735 // see 657029, 657560 and co, so if we have no extension on the request
736 // ask for text only. As a sidenote: If there is nothing to negotiate servers
737 // seem to be nice and ignore it.
738 if (_config
->FindB("Acquire::http::SendAccept", true) == true)
740 size_t const filepos
= Itm
->Uri
.find_last_of('/');
741 string
const file
= Itm
->Uri
.substr(filepos
+ 1);
742 if (flExtension(file
) == file
)
743 Req
<< "Accept: text/*\r\n";
746 // Check for a partial file and send if-queries accordingly
748 if (stat(Itm
->DestFile
.c_str(),&SBuf
) >= 0 && SBuf
.st_size
> 0)
749 Req
<< "Range: bytes=" << std::to_string(SBuf
.st_size
) << "-\r\n"
750 << "If-Range: " << TimeRFC1123(SBuf
.st_mtime
, false) << "\r\n";
751 else if (Itm
->LastModified
!= 0)
752 Req
<< "If-Modified-Since: " << TimeRFC1123(Itm
->LastModified
, false).c_str() << "\r\n";
754 if (Server
->Proxy
.User
.empty() == false || Server
->Proxy
.Password
.empty() == false)
755 Req
<< "Proxy-Authorization: Basic "
756 << Base64Encode(Server
->Proxy
.User
+ ":" + Server
->Proxy
.Password
) << "\r\n";
758 maybe_add_auth (Uri
, _config
->FindFile("Dir::Etc::netrc"));
759 if (Uri
.User
.empty() == false || Uri
.Password
.empty() == false)
760 Req
<< "Authorization: Basic "
761 << Base64Encode(Uri
.User
+ ":" + Uri
.Password
) << "\r\n";
763 Req
<< "User-Agent: " << _config
->Find("Acquire::http::User-Agent",
764 "Debian APT-HTTP/1.3 (" PACKAGE_VERSION
")") << "\r\n";
769 cerr
<< Req
.str() << endl
;
771 Server
->WriteResponse(Req
.str());
774 // HttpMethod::Configuration - Handle a configuration message /*{{{*/
775 // ---------------------------------------------------------------------
776 /* We stash the desired pipeline depth */
777 bool HttpMethod::Configuration(string Message
)
779 if (ServerMethod::Configuration(Message
) == false)
782 AllowRedirect
= _config
->FindB("Acquire::http::AllowRedirect",true);
783 PipelineDepth
= _config
->FindI("Acquire::http::Pipeline-Depth",
785 Debug
= _config
->FindB("Debug::Acquire::http",false);
790 std::unique_ptr
<ServerState
> HttpMethod::CreateServerState(URI
const &uri
)/*{{{*/
792 return std::unique_ptr
<ServerState
>(new HttpServerState(uri
, this));
795 void HttpMethod::RotateDNS() /*{{{*/