1 // -*- mode: cpp; mode: fold -*-
3 /* ######################################################################
5 HTTP and HTTPS share a lot of common code and these classes are
6 exactly the dumping ground for this common code
8 ##################################################################### */
10 // Include Files /*{{{*/
13 #include <apt-pkg/acquire-method.h>
14 #include <apt-pkg/configuration.h>
15 #include <apt-pkg/error.h>
16 #include <apt-pkg/fileutl.h>
17 #include <apt-pkg/strutl.h>
39 string
ServerMethod::FailFile
;
40 int ServerMethod::FailFd
= -1;
41 time_t ServerMethod::FailTime
= 0;
43 // ServerState::RunHeaders - Get the headers before the data /*{{{*/
44 // ---------------------------------------------------------------------
45 /* Returns RUN_HEADERS_OK if things are OK, RUN_HEADERS_IO_ERROR if an IO
46 error occurred and RUN_HEADERS_PARSE_ERROR if a header parse error occurred */
47 ServerState::RunHeadersResult
ServerState::RunHeaders(FileFd
* const File
,
48 const std::string
&Uri
)
52 Owner
->Status(_("Waiting for headers"));
67 if (ReadHeaderLines(Data
) == false)
70 if (Owner
->Debug
== true)
71 clog
<< "Answer for: " << Uri
<< endl
<< Data
;
73 for (string::const_iterator I
= Data
.begin(); I
< Data
.end(); ++I
)
75 string::const_iterator J
= I
;
76 for (; J
!= Data
.end() && *J
!= '\n' && *J
!= '\r'; ++J
);
77 if (HeaderLine(string(I
,J
)) == false)
78 return RUN_HEADERS_PARSE_ERROR
;
82 // 100 Continue is a Nop...
86 // Tidy up the connection persistence state.
87 if (Encoding
== Closes
&& HaveContent
== true)
90 return RUN_HEADERS_OK
;
92 while (LoadNextResponse(false, File
) == true);
94 return RUN_HEADERS_IO_ERROR
;
97 // ServerState::HeaderLine - Process a header line /*{{{*/
98 // ---------------------------------------------------------------------
100 bool ServerState::HeaderLine(string Line
)
102 if (Line
.empty() == true)
105 string::size_type Pos
= Line
.find(' ');
106 if (Pos
== string::npos
|| Pos
+1 > Line
.length())
108 // Blah, some servers use "connection:closes", evil.
109 Pos
= Line
.find(':');
110 if (Pos
== string::npos
|| Pos
+ 2 > Line
.length())
111 return _error
->Error(_("Bad header line"));
115 // Parse off any trailing spaces between the : and the next word.
116 string::size_type Pos2
= Pos
;
117 while (Pos2
< Line
.length() && isspace_ascii(Line
[Pos2
]) != 0)
120 string Tag
= string(Line
,0,Pos
);
121 string Val
= string(Line
,Pos2
);
123 if (stringcasecmp(Tag
.c_str(),Tag
.c_str()+4,"HTTP") == 0)
125 // Evil servers return no version
128 int const elements
= sscanf(Line
.c_str(),"HTTP/%3u.%3u %3u%359[^\n]",&Major
,&Minor
,&Result
,Code
);
132 if (Owner
!= NULL
&& Owner
->Debug
== true)
133 clog
<< "HTTP server doesn't give Reason-Phrase for " << Result
<< std::endl
;
135 else if (elements
!= 4)
136 return _error
->Error(_("The HTTP server sent an invalid reply header"));
142 if (sscanf(Line
.c_str(),"HTTP %3u%359[^\n]",&Result
,Code
) != 2)
143 return _error
->Error(_("The HTTP server sent an invalid reply header"));
146 /* Check the HTTP response header to get the default persistence
152 if (Major
== 1 && Minor
== 0)
167 if (stringcasecmp(Tag
,"Content-Length:") == 0)
169 if (Encoding
== Closes
)
173 unsigned long long * DownloadSizePtr
= &DownloadSize
;
175 DownloadSizePtr
= &JunkSize
;
177 *DownloadSizePtr
= strtoull(Val
.c_str(), NULL
, 10);
178 if (*DownloadSizePtr
>= std::numeric_limits
<unsigned long long>::max())
179 return _error
->Errno("HeaderLine", _("The HTTP server sent an invalid Content-Length header"));
180 else if (*DownloadSizePtr
== 0)
183 // On partial content (206) the Content-Length is less than the real
184 // size, so do not set it here but leave that to the Content-Range
186 if(Result
!= 206 && TotalFileSize
== 0)
187 TotalFileSize
= DownloadSize
;
192 if (stringcasecmp(Tag
,"Content-Type:") == 0)
198 if (stringcasecmp(Tag
,"Content-Range:") == 0)
202 // §14.16 says 'byte-range-resp-spec' should be a '*' in case of 416
203 if (Result
== 416 && sscanf(Val
.c_str(), "bytes */%llu",&TotalFileSize
) == 1)
204 ; // we got the expected filesize which is all we wanted
205 else if (sscanf(Val
.c_str(),"bytes %llu-%*u/%llu",&StartPos
,&TotalFileSize
) != 2)
206 return _error
->Error(_("The HTTP server sent an invalid Content-Range header"));
207 if ((unsigned long long)StartPos
> TotalFileSize
)
208 return _error
->Error(_("This HTTP server has broken range support"));
210 // figure out what we will download
211 DownloadSize
= TotalFileSize
- StartPos
;
215 if (stringcasecmp(Tag
,"Transfer-Encoding:") == 0)
218 if (stringcasecmp(Val
,"chunked") == 0)
223 if (stringcasecmp(Tag
,"Connection:") == 0)
225 if (stringcasecmp(Val
,"close") == 0)
227 if (stringcasecmp(Val
,"keep-alive") == 0)
232 if (stringcasecmp(Tag
,"Last-Modified:") == 0)
234 if (RFC1123StrToTime(Val
.c_str(), Date
) == false)
235 return _error
->Error(_("Unknown date format"));
239 if (stringcasecmp(Tag
,"Location:") == 0)
248 // ServerState::ServerState - Constructor /*{{{*/
249 ServerState::ServerState(URI Srv
, ServerMethod
*Owner
) : ServerName(Srv
), TimeOut(120), Owner(Owner
)
254 bool ServerState::AddPartialFileToHashes(FileFd
&File
) /*{{{*/
256 File
.Truncate(StartPos
);
257 return GetHashes()->AddFD(File
, StartPos
);
261 // ServerMethod::DealWithHeaders - Handle the retrieved header data /*{{{*/
262 // ---------------------------------------------------------------------
263 /* We look at the header data we got back from the server and decide what
264 to do. Returns DealWithHeadersResult (see http.h for details).
266 ServerMethod::DealWithHeadersResult
267 ServerMethod::DealWithHeaders(FetchResult
&Res
)
270 if (Server
->Result
== 304)
272 RemoveFile("server", Queue
->DestFile
);
274 Res
.LastModified
= Queue
->LastModified
;
280 * Note that it is only OK for us to treat all redirection the same
281 * because we *always* use GET, not other HTTP methods. There are
282 * three redirection codes for which it is not appropriate that we
283 * redirect. Pass on those codes so the error handling kicks in.
286 && (Server
->Result
> 300 && Server
->Result
< 400)
287 && (Server
->Result
!= 300 // Multiple Choices
288 && Server
->Result
!= 304 // Not Modified
289 && Server
->Result
!= 306)) // (Not part of HTTP/1.1, reserved)
291 if (Server
->Location
.empty() == true);
292 else if (Server
->Location
[0] == '/' && Queue
->Uri
.empty() == false)
294 URI Uri
= Queue
->Uri
;
295 if (Uri
.Host
.empty() == false)
296 NextURI
= URI::SiteOnly(Uri
);
299 NextURI
.append(DeQuoteString(Server
->Location
));
300 return TRY_AGAIN_OR_REDIRECT
;
304 NextURI
= DeQuoteString(Server
->Location
);
305 URI tmpURI
= NextURI
;
306 URI Uri
= Queue
->Uri
;
307 // same protocol redirects are okay
308 if (tmpURI
.Access
== Uri
.Access
)
309 return TRY_AGAIN_OR_REDIRECT
;
310 // as well as http to https
311 else if (Uri
.Access
== "http" && tmpURI
.Access
== "https")
312 return TRY_AGAIN_OR_REDIRECT
;
314 /* else pass through for error message */
316 // retry after an invalid range response without partial data
317 else if (Server
->Result
== 416)
320 if (stat(Queue
->DestFile
.c_str(),&SBuf
) >= 0 && SBuf
.st_size
> 0)
322 bool partialHit
= false;
323 if (Queue
->ExpectedHashes
.usable() == true)
325 Hashes
resultHashes(Queue
->ExpectedHashes
);
326 FileFd
file(Queue
->DestFile
, FileFd::ReadOnly
);
327 Server
->TotalFileSize
= file
.FileSize();
328 Server
->Date
= file
.ModificationTime();
329 resultHashes
.AddFD(file
);
330 HashStringList
const hashList
= resultHashes
.GetHashStringList();
331 partialHit
= (Queue
->ExpectedHashes
== hashList
);
333 else if ((unsigned long long)SBuf
.st_size
== Server
->TotalFileSize
)
335 if (partialHit
== true)
337 // the file is completely downloaded, but was not moved
338 if (Server
->HaveContent
== true)
340 // Send the error page to /dev/null
341 FileFd
DevNull("/dev/null",FileFd::WriteExists
);
342 Server
->RunData(&DevNull
);
344 Server
->HaveContent
= false;
345 Server
->StartPos
= Server
->TotalFileSize
;
346 Server
->Result
= 200;
348 else if (RemoveFile("server", Queue
->DestFile
))
350 NextURI
= Queue
->Uri
;
351 return TRY_AGAIN_OR_REDIRECT
;
356 /* We have a reply we don't handle. This should indicate a perm server
358 if (Server
->Result
< 200 || Server
->Result
>= 300)
361 strprintf(err
, "HttpError%u", Server
->Result
);
363 _error
->Error("%u %s", Server
->Result
, Server
->Code
);
364 if (Server
->HaveContent
== true)
365 return ERROR_WITH_CONTENT_PAGE
;
366 return ERROR_UNRECOVERABLE
;
369 // This is some sort of 2xx 'data follows' reply
370 Res
.LastModified
= Server
->Date
;
371 Res
.Size
= Server
->TotalFileSize
;
375 File
= new FileFd(Queue
->DestFile
,FileFd::WriteAny
);
376 if (_error
->PendingError() == true)
377 return ERROR_NOT_FROM_SERVER
;
379 FailFile
= Queue
->DestFile
;
380 FailFile
.c_str(); // Make sure we don't do a malloc in the signal handler
382 FailTime
= Server
->Date
;
384 if (Server
->InitHashes(Queue
->ExpectedHashes
) == false || Server
->AddPartialFileToHashes(*File
) == false)
386 _error
->Errno("read",_("Problem hashing file"));
387 return ERROR_NOT_FROM_SERVER
;
389 if (Server
->StartPos
> 0)
390 Res
.ResumePoint
= Server
->StartPos
;
392 SetNonBlock(File
->Fd(),true);
396 // ServerMethod::SigTerm - Handle a fatal signal /*{{{*/
397 // ---------------------------------------------------------------------
398 /* This closes and timestamps the open file. This is necessary to get
399 resume behavior on user abort */
400 void ServerMethod::SigTerm(int)
405 struct timeval times
[2];
406 times
[0].tv_sec
= FailTime
;
407 times
[1].tv_sec
= FailTime
;
408 times
[0].tv_usec
= times
[1].tv_usec
= 0;
409 utimes(FailFile
.c_str(), times
);
415 // ServerMethod::Fetch - Fetch an item /*{{{*/
416 // ---------------------------------------------------------------------
417 /* This adds an item to the pipeline. We keep the pipeline at a fixed
419 bool ServerMethod::Fetch(FetchItem
*)
424 // Queue the requests
426 for (FetchItem
*I
= Queue
; I
!= 0 && Depth
< (signed)PipelineDepth
;
427 I
= I
->Next
, Depth
++)
431 // If pipelining is disabled, we only queue 1 request
432 if (Server
->Pipeline
== false)
434 // if we have no hashes, do at most one such request
435 // as we can't fixup pipelining misbehaviors otherwise
436 else if (I
->ExpectedHashes
.usable() == false)
440 // Make sure we stick with the same server
441 if (Server
->Comp(I
->Uri
) == false)
454 // ServerMethod::Loop - Main loop /*{{{*/
455 int ServerMethod::Loop()
457 typedef vector
<string
> StringVector
;
458 typedef vector
<string
>::iterator StringVectorIterator
;
459 map
<string
, StringVector
> Redirected
;
461 signal(SIGTERM
,SigTerm
);
462 signal(SIGINT
,SigTerm
);
469 // We have no commands, wait for some to arrive
472 if (WaitFd(STDIN_FILENO
) == false)
476 /* Run messages, we can accept 0 (no message) if we didn't
477 do a WaitFd above.. Otherwise the FD is closed. */
478 int Result
= Run(true);
479 if (Result
!= -1 && (Result
!= 0 || Queue
== 0))
481 if(FailReason
.empty() == false ||
482 _config
->FindB("Acquire::http::DependOnSTDIN", true) == true)
491 // Connect to the server
492 if (Server
== 0 || Server
->Comp(Queue
->Uri
) == false)
493 Server
= CreateServerState(Queue
->Uri
);
495 /* If the server has explicitly said this is the last connection
496 then we pre-emptively shut down the pipeline and tear down
497 the connection. This will speed up HTTP/1.0 servers a tad
498 since we don't have to wait for the close sequence to
500 if (Server
->Persistent
== false)
503 // Reset the pipeline
504 if (Server
->IsOpen() == false)
507 // Connect to the host
508 if (Server
->Open() == false)
515 // Fill the pipeline.
518 // Fetch the next URL header data from the server.
519 switch (Server
->RunHeaders(File
, Queue
->Uri
))
521 case ServerState::RUN_HEADERS_OK
:
524 // The header data is bad
525 case ServerState::RUN_HEADERS_PARSE_ERROR
:
527 _error
->Error(_("Bad header data"));
533 // The server closed a connection during the header get..
535 case ServerState::RUN_HEADERS_IO_ERROR
:
540 Server
->Pipeline
= false;
541 Server
->PipelineAllowed
= false;
543 if (FailCounter
>= 2)
545 Fail(_("Connection failed"),true);
554 // Decide what to do.
556 Res
.Filename
= Queue
->DestFile
;
557 switch (DealWithHeaders(Res
))
559 // Ok, the file is Open
567 // ensure we don't fetch too much
568 // we could do "Server->MaximumSize = Queue->MaximumSize" here
569 // but that would break the clever pipeline messup detection
570 // so instead we use the size of the biggest item in the queue
571 Server
->MaximumSize
= FindMaximumObjectSizeInQueue();
573 if (Server
->HaveContent
)
574 Result
= Server
->RunData(File
);
576 /* If the server is sending back sizeless responses then fill in
579 Res
.Size
= File
->Size();
581 // Close the file, destroy the FD object and timestamp it
587 struct timeval times
[2];
588 times
[0].tv_sec
= times
[1].tv_sec
= Server
->Date
;
589 times
[0].tv_usec
= times
[1].tv_usec
= 0;
590 utimes(Queue
->DestFile
.c_str(), times
);
592 // Send status to APT
595 Hashes
* const resultHashes
= Server
->GetHashes();
596 HashStringList
const hashList
= resultHashes
->GetHashStringList();
597 if (PipelineDepth
!= 0 && Queue
->ExpectedHashes
.usable() == true && Queue
->ExpectedHashes
!= hashList
)
599 // we did not get the expected hash… mhhh:
600 // could it be that server/proxy messed up pipelining?
601 FetchItem
* BeforeI
= Queue
;
602 for (FetchItem
*I
= Queue
->Next
; I
!= 0 && I
!= QueueBack
; I
= I
->Next
)
604 if (I
->ExpectedHashes
.usable() == true && I
->ExpectedHashes
== hashList
)
606 // yes, he did! Disable pipelining and rewrite queue
607 if (Server
->Pipeline
== true)
609 // FIXME: fake a warning message as we have no proper way of communicating here
611 strprintf(out
, _("Automatically disabled %s due to incorrect response from server/proxy. (man 5 apt.conf)"), "Acquire::http::PipelineDepth");
612 std::cerr
<< "W: " << out
<< std::endl
;
613 Server
->Pipeline
= false;
614 Server
->PipelineAllowed
= false;
615 // we keep the PipelineDepth value so that the rest of the queue can be fixed up as well
617 Rename(Res
.Filename
, I
->DestFile
);
618 Res
.Filename
= I
->DestFile
;
619 BeforeI
->Next
= I
->Next
;
627 Res
.TakeHashes(*resultHashes
);
632 if (Server
->IsOpen() == false)
638 if (FailCounter
>= 2)
640 Fail(_("Connection failed"),true);
662 // Hard server error, not found or something
663 case ERROR_UNRECOVERABLE
:
669 // Hard internal error, kill the connection and fail
670 case ERROR_NOT_FROM_SERVER
:
681 // We need to flush the data, the header is like a 404 w/ error text
682 case ERROR_WITH_CONTENT_PAGE
:
686 // Send the content to /dev/null
687 File
= new FileFd("/dev/null",FileFd::WriteExists
);
688 Server
->RunData(File
);
694 // Try again with a new URL
695 case TRY_AGAIN_OR_REDIRECT
:
697 // Clear rest of response if there is content
698 if (Server
->HaveContent
)
700 File
= new FileFd("/dev/null",FileFd::WriteExists
);
701 Server
->RunData(File
);
706 /* Detect redirect loops. No more redirects are allowed
707 after the same URI is seen twice in a queue item. */
708 StringVector
&R
= Redirected
[Queue
->DestFile
];
709 bool StopRedirects
= false;
710 if (R
.empty() == true)
711 R
.push_back(Queue
->Uri
);
712 else if (R
[0] == "STOP" || R
.size() > 10)
713 StopRedirects
= true;
716 for (StringVectorIterator I
= R
.begin(); I
!= R
.end(); ++I
)
717 if (Queue
->Uri
== *I
)
723 R
.push_back(Queue
->Uri
);
726 if (StopRedirects
== false)
735 Fail(_("Internal error"));
745 unsigned long long ServerMethod::FindMaximumObjectSizeInQueue() const /*{{{*/
747 unsigned long long MaxSizeInQueue
= 0;
748 for (FetchItem
*I
= Queue
; I
!= 0 && I
!= QueueBack
; I
= I
->Next
)
749 MaxSizeInQueue
= std::max(MaxSizeInQueue
, I
->MaximumSize
);
750 return MaxSizeInQueue
;
753 ServerMethod::ServerMethod(char const * const Binary
, char const * const Ver
,unsigned long const Flags
) :/*{{{*/
754 aptMethod(Binary
, Ver
, Flags
), Server(nullptr), File(NULL
), PipelineDepth(10),
755 AllowRedirect(false), Debug(false)