blob: 99019ddce58432b81c24395e55b316eabd155cba [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
#include "pagespeed/kernel/http/response_headers_parser.h"
#include "base/logging.h"
#include "pagespeed/kernel/base/message_handler.h"
#include "pagespeed/kernel/base/string.h"
#include "pagespeed/kernel/base/string_util.h"
#include "pagespeed/kernel/http/response_headers.h"
namespace net_instaweb {
void ResponseHeadersParser::Clear() {
parsing_http_ = false;
parsing_value_ = false;
headers_complete_ = false;
}
// TODO(jmaessen): http://www.w3.org/Protocols/rfc2616/rfc2616-sec4.html#sec4.2
// This parser probably handles multi-line headers incorrectly: per the RFC,
// header fields can be extended over multiple lines by preceding each extra
// line with at least one SP or HT.
// Incrementally parses a chunk of raw HTTP response-header text, one
// character at a time.
//
// Parsing state (the partially read name/value and the parsing_* flags) lives
// in member variables, so a header line may be split across successive calls.
// Each completed line is handed to response_headers_: the "HTTP/..." status
// line via ParseFirstLineHelper(), every other line via Add().  A blank line
// marks the end of the headers, at which point headers_complete_ is set and
// ComputeCaching() is invoked.
//
// Args:
//   text:    the next bytes of the response.
//   handler: receives an error message if a second "HTTP/" line is seen after
//            the version has already been parsed.
//
// Returns the number of bytes of 'text' that were consumed.  This equals
// text.size() unless the terminating blank line was found, in which case it
// is the offset just past that line's '\n'.
//
// Must not be called once the headers are complete (CHECK-fails).
int ResponseHeadersParser::ParseChunk(const StringPiece& text,
                                      MessageHandler* handler) {
  CHECK(!headers_complete_);
  int num_consumed = 0;
  const int num_bytes = static_cast<int>(text.size());
  for (; num_consumed < num_bytes; ++num_consumed) {
    const char c = text[num_consumed];
    // Only treat '/' as the status-line marker while still reading the name.
    // Without the !parsing_value_ guard, a '/' appearing later on the status
    // line (e.g. in the reason phrase) or in the value of a header literally
    // named "HTTP" would be swallowed instead of being kept in the value.
    if (!parsing_value_ && (c == '/') && (parse_name_ == "HTTP")) {
      if (response_headers_->has_major_version()) {
        handler->MessageS(kError, "Multiple HTTP Lines");
      } else {
        parsing_http_ = true;
        parsing_value_ = true;
      }
    } else if (!parsing_value_ && (c == ':')) {
      // First ':' separates the name from the value; later ones are part of
      // the value.
      parsing_value_ = true;
    } else if (c == '\r') {
      // Just ignore CRs for now, and break up headers on newlines for
      // simplicity.  It's not clear to me if it's important that we
      // reject headers that lack the CR in front of the LF.
    } else if (c == '\n') {
      if (parse_name_.empty()) {
        // Blank line.  This marks the end of the headers.  Count the '\n'
        // itself as consumed, since 'break' skips the loop increment.
        ++num_consumed;
        headers_complete_ = true;
        response_headers_->ComputeCaching();
        break;
      }
      if (parsing_http_) {
        response_headers_->ParseFirstLineHelper(parse_value_);
        parsing_http_ = false;
      } else {
        response_headers_->Add(parse_name_, parse_value_);
      }
      // Reset the per-line state for the next header line.
      parsing_value_ = false;
      parse_name_.clear();
      parse_value_.clear();
    } else if (parsing_value_) {
      // Skip leading whitespace (form feeds don't count, unlike html).
      if (!parse_value_.empty() || !IsHtmlSpace(c) || c == '\f') {
        parse_value_ += c;
      }
    } else {
      parse_name_ += c;
    }
  }
  return num_consumed;
}
} // namespace net_instaweb