]>
git.saurik.com Git - apt.git/blob - methods/http.cc
1 // -*- mode: cpp; mode: fold -*-
3 // $Id: http.cc,v 1.59 2004/05/08 19:42:35 mdz Exp $
4 /* ######################################################################
6 HTTP Acquire Method - This is the HTTP acquire method for APT.
8 It uses HTTP/1.1 and many of the fancy options there-in, such as
9 pipelining, range, if-range and so on.
11 It is based on a doubly buffered select loop. A group of requests are
12 fed into a single output buffer that is constantly fed out the
13 socket. This provides ideal pipelining as in many cases all of the
14 requests will fit into a single packet. The input socket is buffered
15 the same way and fed into the fd for the file (may be a pipe in future).
17 This double buffering provides fairly substantial transfer rates,
18 compared to wget the http method is about 4% faster. Most importantly,
19 when HTTP is compared with FTP as a protocol the speed difference is
20 huge. In tests over the internet from two sites to llug (via ATM) this
21 program got 230k/s sustained http transfer rates. FTP on the other
22 hand topped out at 170k/s. That combined with the time to setup the
23 FTP connection makes HTTP a vastly superior protocol.
25 ##################################################################### */
27 // Include Files /*{{{*/
30 #include <apt-pkg/fileutl.h>
31 #include <apt-pkg/acquire-method.h>
32 #include <apt-pkg/configuration.h>
33 #include <apt-pkg/error.h>
34 #include <apt-pkg/hashes.h>
35 #include <apt-pkg/netrc.h>
54 #include "rfc2553emu.h"
61 unsigned long long CircleBuf::BwReadLimit
=0;
62 unsigned long long CircleBuf::BwTickReadData
=0;
63 struct timeval
CircleBuf::BwReadTick
={0,0};
64 const unsigned int CircleBuf::BW_HZ
=10;
66 // CircleBuf::CircleBuf - Circular input buffer /*{{{*/
67 // ---------------------------------------------------------------------
69 CircleBuf::CircleBuf(unsigned long long Size
) : Size(Size
), Hash(0)
71 Buf
= new unsigned char[Size
];
74 CircleBuf::BwReadLimit
= _config
->FindI("Acquire::http::Dl-Limit",0)*1024;
77 // CircleBuf::Reset - Reset to the default state /*{{{*/
78 // ---------------------------------------------------------------------
80 void CircleBuf::Reset()
85 MaxGet
= (unsigned long long)-1;
94 // CircleBuf::Read - Read from a FD into the circular buffer /*{{{*/
95 // ---------------------------------------------------------------------
96 /* This fills up the buffer with as much data as is in the FD, assuming it
98 bool CircleBuf::Read(int Fd
)
102 // Woops, buffer is full
103 if (InP
- OutP
== Size
)
106 // what's left to read in this tick
107 unsigned long long const BwReadMax
= CircleBuf::BwReadLimit
/BW_HZ
;
109 if(CircleBuf::BwReadLimit
) {
111 gettimeofday(&now
,0);
113 unsigned long long d
= (now
.tv_sec
-CircleBuf::BwReadTick
.tv_sec
)*1000000 +
114 now
.tv_usec
-CircleBuf::BwReadTick
.tv_usec
;
115 if(d
> 1000000/BW_HZ
) {
116 CircleBuf::BwReadTick
= now
;
117 CircleBuf::BwTickReadData
= 0;
120 if(CircleBuf::BwTickReadData
>= BwReadMax
) {
121 usleep(1000000/BW_HZ
);
126 // Write the buffer segment
128 if(CircleBuf::BwReadLimit
) {
129 Res
= read(Fd
,Buf
+ (InP%Size
),
130 BwReadMax
> LeftRead() ? LeftRead() : BwReadMax
);
132 Res
= read(Fd
,Buf
+ (InP%Size
),LeftRead());
134 if(Res
> 0 && BwReadLimit
> 0)
135 CircleBuf::BwTickReadData
+= Res
;
147 gettimeofday(&Start
,0);
152 // CircleBuf::Read - Put the string into the buffer /*{{{*/
153 // ---------------------------------------------------------------------
154 /* This will hold the string in and fill the buffer with it as it empties */
155 bool CircleBuf::Read(string Data
)
162 // CircleBuf::FillOut - Fill the buffer from the output queue /*{{{*/
163 // ---------------------------------------------------------------------
165 void CircleBuf::FillOut()
167 if (OutQueue
.empty() == true)
171 // Woops, buffer is full
172 if (InP
- OutP
== Size
)
175 // Write the buffer segment
176 unsigned long long Sz
= LeftRead();
177 if (OutQueue
.length() - StrPos
< Sz
)
178 Sz
= OutQueue
.length() - StrPos
;
179 memcpy(Buf
+ (InP%Size
),OutQueue
.c_str() + StrPos
,Sz
);
184 if (OutQueue
.length() == StrPos
)
193 // CircleBuf::Write - Write from the buffer into a FD /*{{{*/
194 // ---------------------------------------------------------------------
195 /* This empties the buffer into the FD. */
196 bool CircleBuf::Write(int Fd
)
202 // Woops, buffer is empty
209 // Write the buffer segment
211 Res
= write(Fd
,Buf
+ (OutP%Size
),LeftWrite());
224 Hash
->Add(Buf
+ (OutP%Size
),Res
);
230 // CircleBuf::WriteTillEl - Write from the buffer to a string /*{{{*/
231 // ---------------------------------------------------------------------
232 /* This copies till the first empty line */
233 bool CircleBuf::WriteTillEl(string
&Data
,bool Single
)
235 // We cheat and assume it is unneeded to have more than one buffer load
236 for (unsigned long long I
= OutP
; I
< InP
; I
++)
238 if (Buf
[I%Size
] != '\n')
244 if (I
< InP
&& Buf
[I%Size
] == '\r')
246 if (I
>= InP
|| Buf
[I%Size
] != '\n')
254 unsigned long long Sz
= LeftWrite();
259 Data
+= string((char *)(Buf
+ (OutP%Size
)),Sz
);
267 // CircleBuf::Stats - Print out stats information /*{{{*/
268 // ---------------------------------------------------------------------
270 void CircleBuf::Stats()
276 gettimeofday(&Stop
,0);
277 /* float Diff = Stop.tv_sec - Start.tv_sec +
278 (float)(Stop.tv_usec - Start.tv_usec)/1000000;
279 clog << "Got " << InP << " in " << Diff << " at " << InP/Diff << endl;*/
282 CircleBuf::~CircleBuf()
288 // HttpServerState::HttpServerState - Constructor /*{{{*/
289 HttpServerState::HttpServerState(URI Srv
,HttpMethod
*Owner
) : ServerState(Srv
, Owner
), In(64*1024), Out(4*1024)
291 TimeOut
= _config
->FindI("Acquire::http::Timeout",TimeOut
);
295 // HttpServerState::Open - Open a connection to the server /*{{{*/
296 // ---------------------------------------------------------------------
297 /* This opens a connection to the server. */
298 bool HttpServerState::Open()
300 // Use the already open connection if possible.
309 // Determine the proxy setting
310 string SpecificProxy
= _config
->Find("Acquire::http::Proxy::" + ServerName
.Host
);
311 if (!SpecificProxy
.empty())
313 if (SpecificProxy
== "DIRECT")
316 Proxy
= SpecificProxy
;
320 string DefProxy
= _config
->Find("Acquire::http::Proxy");
321 if (!DefProxy
.empty())
327 char* result
= getenv("http_proxy");
328 Proxy
= result
? result
: "";
332 // Parse no_proxy, a , separated list of domains
333 if (getenv("no_proxy") != 0)
335 if (CheckDomainList(ServerName
.Host
,getenv("no_proxy")) == true)
339 // Determine what host and port to use based on the proxy settings
342 if (Proxy
.empty() == true || Proxy
.Host
.empty() == true)
344 if (ServerName
.Port
!= 0)
345 Port
= ServerName
.Port
;
346 Host
= ServerName
.Host
;
355 // Connect to the remote server
356 if (Connect(Host
,Port
,"http",80,ServerFd
,TimeOut
,Owner
) == false)
362 // HttpServerState::Close - Close a connection to the server /*{{{*/
363 // ---------------------------------------------------------------------
365 bool HttpServerState::Close()
372 // HttpServerState::RunData - Transfer the data from the socket /*{{{*/
373 bool HttpServerState::RunData(FileFd
* const File
)
377 // Chunked transfer encoding is fun..
378 if (Encoding
== Chunked
)
382 // Grab the block size
388 if (In
.WriteTillEl(Data
,true) == true)
391 while ((Last
= Go(false, File
)) == true);
396 // See if we are done
397 unsigned long long Len
= strtoull(Data
.c_str(),0,16);
402 // We have to remove the entity trailer
406 if (In
.WriteTillEl(Data
,true) == true && Data
.length() <= 2)
409 while ((Last
= Go(false, File
)) == true);
412 return !_error
->PendingError();
415 // Transfer the block
417 while (Go(true, File
) == true)
418 if (In
.IsLimit() == true)
422 if (In
.IsLimit() == false)
425 // The server sends an extra new line before the next block specifier..
430 if (In
.WriteTillEl(Data
,true) == true)
433 while ((Last
= Go(false, File
)) == true);
440 /* Closes encoding is used when the server did not specify a size, the
441 loss of the connection means we are done */
442 if (Encoding
== Closes
)
445 In
.Limit(Size
- StartPos
);
447 // Just transfer the whole block.
450 if (In
.IsLimit() == false)
454 return !_error
->PendingError();
456 while (Go(true, File
) == true);
459 return Owner
->Flush() && !_error
->PendingError();
462 bool HttpServerState::ReadHeaderLines(std::string
&Data
) /*{{{*/
464 return In
.WriteTillEl(Data
);
467 bool HttpServerState::LoadNextResponse(bool const ToFile
, FileFd
* const File
)/*{{{*/
469 return Go(ToFile
, File
);
472 bool HttpServerState::WriteResponse(const std::string
&Data
) /*{{{*/
474 return Out
.Read(Data
);
477 bool HttpServerState::IsOpen() /*{{{*/
479 return (ServerFd
!= -1);
482 bool HttpServerState::InitHashes(FileFd
&File
) /*{{{*/
485 In
.Hash
= new Hashes
;
487 // Set the expected size and read file for the hashes
490 File
.Truncate(StartPos
);
492 return In
.Hash
->AddFD(File
, StartPos
);
497 Hashes
* HttpServerState::GetHashes() /*{{{*/
502 // HttpServerState::Die - The server has closed the connection. /*{{{*/
503 bool HttpServerState::Die(FileFd
&File
)
505 unsigned int LErrno
= errno
;
507 // Dump the buffer to the file
508 if (State
== ServerState::Data
)
510 // on GNU/kFreeBSD, apt dies on /dev/null because non-blocking
512 if (File
.Name() != "/dev/null")
513 SetNonBlock(File
.Fd(),false);
514 while (In
.WriteSpace() == true)
516 if (In
.Write(File
.Fd()) == false)
517 return _error
->Errno("write",_("Error writing to the file"));
520 if (In
.IsLimit() == true)
525 // See if this is because the server finished the data stream
526 if (In
.IsLimit() == false && State
!= HttpServerState::Header
&&
527 Encoding
!= HttpServerState::Closes
)
531 return _error
->Error(_("Error reading from server. Remote end closed connection"));
533 return _error
->Errno("read",_("Error reading from server"));
539 // Nothing left in the buffer
540 if (In
.WriteSpace() == false)
543 // We may have got multiple responses back in one packet..
551 // HttpServerState::Flush - Dump the buffer into the file /*{{{*/
552 // ---------------------------------------------------------------------
553 /* This takes the current input buffer from the Server FD and writes it
555 bool HttpServerState::Flush(FileFd
* const File
)
559 // on GNU/kFreeBSD, apt dies on /dev/null because non-blocking
561 if (File
->Name() != "/dev/null")
562 SetNonBlock(File
->Fd(),false);
563 if (In
.WriteSpace() == false)
566 while (In
.WriteSpace() == true)
568 if (In
.Write(File
->Fd()) == false)
569 return _error
->Errno("write",_("Error writing to file"));
570 if (In
.IsLimit() == true)
574 if (In
.IsLimit() == true || Encoding
== ServerState::Closes
)
580 // HttpServerState::Go - Run a single loop /*{{{*/
581 // ---------------------------------------------------------------------
582 /* This runs the select loop over the server FDs, Output file FDs and
584 bool HttpServerState::Go(bool ToFile
, FileFd
* const File
)
586 // Server has closed the connection
587 if (ServerFd
== -1 && (In
.WriteSpace() == false ||
595 /* Add the server. We only send more requests if the connection will
597 if (Out
.WriteSpace() == true && ServerFd
!= -1
598 && Persistent
== true)
599 FD_SET(ServerFd
,&wfds
);
600 if (In
.ReadSpace() == true && ServerFd
!= -1)
601 FD_SET(ServerFd
,&rfds
);
608 if (In
.WriteSpace() == true && ToFile
== true && FileFD
!= -1)
609 FD_SET(FileFD
,&wfds
);
612 if (_config
->FindB("Acquire::http::DependOnSTDIN", true) == true)
613 FD_SET(STDIN_FILENO
,&rfds
);
615 // Figure out the max fd
617 if (MaxFd
< ServerFd
)
625 if ((Res
= select(MaxFd
+1,&rfds
,&wfds
,0,&tv
)) < 0)
629 return _error
->Errno("select",_("Select failed"));
634 _error
->Error(_("Connection timed out"));
639 if (ServerFd
!= -1 && FD_ISSET(ServerFd
,&rfds
))
642 if (In
.Read(ServerFd
) == false)
646 if (ServerFd
!= -1 && FD_ISSET(ServerFd
,&wfds
))
649 if (Out
.Write(ServerFd
) == false)
653 // Send data to the file
654 if (FileFD
!= -1 && FD_ISSET(FileFD
,&wfds
))
656 if (In
.Write(FileFD
) == false)
657 return _error
->Errno("write",_("Error writing to output file"));
660 // Handle commands from APT
661 if (FD_ISSET(STDIN_FILENO
,&rfds
))
663 if (Owner
->Run(true) != -1)
671 // HttpMethod::SendReq - Send the HTTP request /*{{{*/
672 // ---------------------------------------------------------------------
673 /* This places the http request in the outbound buffer */
674 void HttpMethod::SendReq(FetchItem
*Itm
)
678 // The HTTP server expects a hostname with a trailing :port
682 if (Uri
.Host
.find(':') != string::npos
)
683 ProperHost
= '[' + Uri
.Host
+ ']';
685 ProperHost
= Uri
.Host
;
688 sprintf(Buf
,":%u",Uri
.Port
);
693 if (Itm
->Uri
.length() >= sizeof(Buf
))
696 /* RFC 2616 §5.1.2 requires absolute URIs for requests to proxies,
697 but while it's a must for all servers to accept absolute URIs,
698 it is assumed clients will send an absolute path for non-proxies */
699 std::string requesturi
;
700 if (Server
->Proxy
.empty() == true || Server
->Proxy
.Host
.empty())
701 requesturi
= Uri
.Path
;
703 requesturi
= Itm
->Uri
;
705 // The "+" is encoded as a workaround for an Amazon S3 bug
706 // see LP bugs #1003633 and #1086997.
707 requesturi
= QuoteString(requesturi
, "+~ ");
709 /* Build the request. No keep-alive is included as it is the default
710 in 1.1, can cause problems with proxies, and we are an HTTP/1.1
712 C.f. https://tools.ietf.org/wg/httpbis/trac/ticket/158 */
713 sprintf(Buf
,"GET %s HTTP/1.1\r\nHost: %s\r\n",
714 requesturi
.c_str(),ProperHost
.c_str());
716 // generate a cache control header (if needed)
717 if (_config
->FindB("Acquire::http::No-Cache",false) == true)
719 strcat(Buf
,"Cache-Control: no-cache\r\nPragma: no-cache\r\n");
723 if (Itm
->IndexFile
== true)
725 sprintf(Buf
+strlen(Buf
),"Cache-Control: max-age=%u\r\n",
726 _config
->FindI("Acquire::http::Max-Age",0));
730 if (_config
->FindB("Acquire::http::No-Store",false) == true)
731 strcat(Buf
,"Cache-Control: no-store\r\n");
735 // If we ask for uncompressed files servers might respond with content-
736 // negotiation which lets us end up with compressed files we do not support,
737 // see 657029, 657560 and co, so if we have no extension on the request
738 // ask for text only. As a sidenote: If there is nothing to negotiate servers
739 // seem to be nice and ignore it.
740 if (_config
->FindB("Acquire::http::SendAccept", true) == true)
742 size_t const filepos
= Itm
->Uri
.find_last_of('/');
743 string
const file
= Itm
->Uri
.substr(filepos
+ 1);
744 if (flExtension(file
) == file
)
745 strcat(Buf
,"Accept: text/*\r\n");
750 // Check for a partial file
752 if (stat(Itm
->DestFile
.c_str(),&SBuf
) >= 0 && SBuf
.st_size
> 0)
754 // In this case we send an if-range query with a range header
755 sprintf(Buf
,"Range: bytes=%lli-\r\nIf-Range: %s\r\n",(long long)SBuf
.st_size
,
756 TimeRFC1123(SBuf
.st_mtime
).c_str());
761 if (Itm
->LastModified
!= 0)
763 sprintf(Buf
,"If-Modified-Since: %s\r\n",TimeRFC1123(Itm
->LastModified
).c_str());
768 if (Server
->Proxy
.User
.empty() == false || Server
->Proxy
.Password
.empty() == false)
769 Req
+= string("Proxy-Authorization: Basic ") +
770 Base64Encode(Server
->Proxy
.User
+ ":" + Server
->Proxy
.Password
) + "\r\n";
772 maybe_add_auth (Uri
, _config
->FindFile("Dir::Etc::netrc"));
773 if (Uri
.User
.empty() == false || Uri
.Password
.empty() == false)
775 Req
+= string("Authorization: Basic ") +
776 Base64Encode(Uri
.User
+ ":" + Uri
.Password
) + "\r\n";
778 Req
+= "User-Agent: " + _config
->Find("Acquire::http::User-Agent",
779 "Debian APT-HTTP/1.3 (" PACKAGE_VERSION
")") + "\r\n\r\n";
784 Server
->WriteResponse(Req
);
787 // HttpMethod::Configuration - Handle a configuration message /*{{{*/
788 // ---------------------------------------------------------------------
789 /* We stash the desired pipeline depth */
790 bool HttpMethod::Configuration(string Message
)
792 if (ServerMethod::Configuration(Message
) == false)
795 AllowRedirect
= _config
->FindB("Acquire::http::AllowRedirect",true);
796 PipelineDepth
= _config
->FindI("Acquire::http::Pipeline-Depth",
798 Debug
= _config
->FindB("Debug::Acquire::http",false);
800 // Get the proxy to use
806 // HttpMethod::AutoDetectProxy - auto detect proxy /*{{{*/
807 // ---------------------------------------------------------------------
809 bool HttpMethod::AutoDetectProxy()
811 // option is "Acquire::http::Proxy-Auto-Detect" but we allow the old
812 // name without the dash ("-")
813 AutoDetectProxyCmd
= _config
->Find("Acquire::http::Proxy-Auto-Detect",
814 _config
->Find("Acquire::http::ProxyAutoDetect"));
816 if (AutoDetectProxyCmd
.empty())
820 clog
<< "Using auto proxy detect command: " << AutoDetectProxyCmd
<< endl
;
822 int Pipes
[2] = {-1,-1};
823 if (pipe(Pipes
) != 0)
824 return _error
->Errno("pipe", "Failed to create Pipe");
826 pid_t Process
= ExecFork();
830 dup2(Pipes
[1],STDOUT_FILENO
);
831 SetCloseExec(STDOUT_FILENO
,false);
834 Args
[0] = AutoDetectProxyCmd
.c_str();
836 execv(Args
[0],(char **)Args
);
837 cerr
<< "Failed to exec method " << Args
[0] << endl
;
843 int res
= read(InFd
, buf
, sizeof(buf
)-1);
844 ExecWait(Process
, "ProxyAutoDetect", true);
847 return _error
->Errno("read", "Failed to read");
849 return _error
->Warning("ProxyAutoDetect returned no data");
855 clog
<< "auto detect command returned: '" << buf
<< "'" << endl
;
857 if (strstr(buf
, "http://") == buf
)
858 _config
->Set("Acquire::http::proxy", _strstrip(buf
));
863 ServerState
* HttpMethod::CreateServerState(URI uri
) /*{{{*/
865 return new HttpServerState(uri
, this);
868 void HttpMethod::RotateDNS() /*{{{*/