| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| |
| #include "pagespeed/kernel/http/response_headers_parser.h" |
| |
| #include "base/logging.h" |
| #include "pagespeed/kernel/base/message_handler.h" |
| #include "pagespeed/kernel/base/string.h" |
| #include "pagespeed/kernel/base/string_util.h" |
| #include "pagespeed/kernel/http/response_headers.h" |
| |
| namespace net_instaweb { |
| |
| void ResponseHeadersParser::Clear() { |
| parsing_http_ = false; |
| parsing_value_ = false; |
| headers_complete_ = false; |
| } |
| |
| // TODO(jmaessen): http://www.w3.org/Protocols/rfc2616/rfc2616-sec4.html#sec4.2 |
| // I bet we're doing this wrong: |
| // Header fields can be extended over multiple lines by preceding each extra |
| // line with at least one SP or HT. |
| int ResponseHeadersParser::ParseChunk(const StringPiece& text, |
| MessageHandler* handler) { |
| CHECK(!headers_complete_); |
| int num_consumed = 0; |
| int num_bytes = text.size(); |
| |
| for (; num_consumed < num_bytes; ++num_consumed) { |
| char c = text[num_consumed]; |
| if ((c == '/') && (parse_name_ == "HTTP")) { |
| if (response_headers_->has_major_version()) { |
| handler->MessageS(kError, "Multiple HTTP Lines"); |
| } else { |
| parsing_http_ = true; |
| parsing_value_ = true; |
| } |
| } else if (!parsing_value_ && (c == ':')) { |
| parsing_value_ = true; |
| } else if (c == '\r') { |
| // Just ignore CRs for now, and break up headers on newlines for |
| // simplicity. It's not clear to me if it's important that we |
| // reject headers that lack the CR in front of the LF. |
| } else if (c == '\n') { |
| if (parse_name_.empty()) { |
| // blank line. This marks the end of the headers. |
| ++num_consumed; |
| headers_complete_ = true; |
| response_headers_->ComputeCaching(); |
| break; |
| } |
| if (parsing_http_) { |
| response_headers_->ParseFirstLineHelper(parse_value_); |
| parsing_http_ = false; |
| } else { |
| response_headers_->Add(parse_name_, parse_value_); |
| } |
| parsing_value_ = false; |
| parse_name_.clear(); |
| parse_value_.clear(); |
| } else if (parsing_value_) { |
| // Skip leading whitespace (form feeds don't count, unlike html) |
| if (!parse_value_.empty() || !IsHtmlSpace(c) || c == '\f') { |
| parse_value_ += c; |
| } |
| } else { |
| parse_name_ += c; |
| } |
| } |
| return num_consumed; |
| } |
| |
| } // namespace net_instaweb |