| // Copyright 2011 Google Inc. |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| // Author: jmarantz@google.com (Joshua Marantz) |
| |
| #include "pagespeed/kernel/http/response_headers_parser.h" |
| |
| #include "base/logging.h" |
| #include "pagespeed/kernel/base/message_handler.h" |
| #include "pagespeed/kernel/base/string.h" |
| #include "pagespeed/kernel/base/string_util.h" |
| #include "pagespeed/kernel/http/response_headers.h" |
| |
| namespace net_instaweb { |
| |
| void ResponseHeadersParser::Clear() { |
| parsing_http_ = false; |
| parsing_value_ = false; |
| headers_complete_ = false; |
| } |
| |
| // TODO(jmaessen): http://www.w3.org/Protocols/rfc2616/rfc2616-sec4.html#sec4.2 |
| // I bet we're doing this wrong: |
| // Header fields can be extended over multiple lines by preceding each extra |
| // line with at least one SP or HT. |
| int ResponseHeadersParser::ParseChunk(const StringPiece& text, |
| MessageHandler* handler) { |
| CHECK(!headers_complete_); |
| int num_consumed = 0; |
| int num_bytes = text.size(); |
| |
| for (; num_consumed < num_bytes; ++num_consumed) { |
| char c = text[num_consumed]; |
| if ((c == '/') && (parse_name_ == "HTTP")) { |
| if (response_headers_->has_major_version()) { |
| handler->MessageS(kError, "Multiple HTTP Lines"); |
| } else { |
| parsing_http_ = true; |
| parsing_value_ = true; |
| } |
| } else if (!parsing_value_ && (c == ':')) { |
| parsing_value_ = true; |
| } else if (c == '\r') { |
| // Just ignore CRs for now, and break up headers on newlines for |
| // simplicity. It's not clear to me if it's important that we |
| // reject headers that lack the CR in front of the LF. |
| } else if (c == '\n') { |
| if (parse_name_.empty()) { |
| // blank line. This marks the end of the headers. |
| ++num_consumed; |
| headers_complete_ = true; |
| response_headers_->ComputeCaching(); |
| break; |
| } |
| if (parsing_http_) { |
| response_headers_->ParseFirstLineHelper(parse_value_); |
| parsing_http_ = false; |
| } else { |
| response_headers_->Add(parse_name_, parse_value_); |
| } |
| parsing_value_ = false; |
| parse_name_.clear(); |
| parse_value_.clear(); |
| } else if (parsing_value_) { |
| // Skip leading whitespace (form feeds don't count, unlike html) |
| if (!parse_value_.empty() || !IsHtmlSpace(c) || c == '\f') { |
| parse_value_ += c; |
| } |
| } else { |
| parse_name_ += c; |
| } |
| } |
| return num_consumed; |
| } |
| |
| } // namespace net_instaweb |