| // Licensed to the Apache Software Foundation (ASF) under one |
| // or more contributor license agreements. See the NOTICE file |
| // distributed with this work for additional information |
| // regarding copyright ownership. The ASF licenses this file |
| // to you under the Apache License, Version 2.0 (the |
| // "License"); you may not use this file except in compliance |
| // with the License. You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, |
| // software distributed under the License is distributed on an |
| // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| // KIND, either express or implied. See the License for the |
| // specific language governing permissions and limitations |
| // under the License. |
| |
| use std::fmt::Debug; |
| use std::sync::Arc; |
| |
| use http::Request; |
| use http::Response; |
| use http::StatusCode; |
| |
| use crate::error::parse_error; |
| use opendal_core::raw::*; |
| use opendal_core::*; |
| |
| pub struct IpfsCore { |
| pub info: Arc<AccessorInfo>, |
| pub endpoint: String, |
| pub root: String, |
| } |
| |
| impl Debug for IpfsCore { |
| fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { |
| f.debug_struct("IpfsCore") |
| .field("endpoint", &self.endpoint) |
| .field("root", &self.root) |
| .finish_non_exhaustive() |
| } |
| } |
| |
| impl IpfsCore { |
| pub async fn ipfs_get(&self, path: &str, range: BytesRange) -> Result<Response<HttpBody>> { |
| let p = build_rooted_abs_path(&self.root, path); |
| |
| let url = format!("{}{}", self.endpoint, percent_encode_path(&p)); |
| |
| let mut req = Request::get(&url); |
| |
| if !range.is_full() { |
| req = req.header(http::header::RANGE, range.to_header()); |
| } |
| |
| let req = req.body(Buffer::new()).map_err(new_request_build_error)?; |
| |
| self.info.http_client().fetch(req).await |
| } |
| |
| pub async fn ipfs_head(&self, path: &str) -> Result<Response<Buffer>> { |
| let p = build_rooted_abs_path(&self.root, path); |
| |
| let url = format!("{}{}", self.endpoint, percent_encode_path(&p)); |
| |
| let req = Request::head(&url); |
| |
| let req = req.body(Buffer::new()).map_err(new_request_build_error)?; |
| |
| self.info.http_client().send(req).await |
| } |
| |
| pub async fn ipfs_list(&self, path: &str) -> Result<Response<Buffer>> { |
| let p = build_rooted_abs_path(&self.root, path); |
| |
| let url = format!("{}{}", self.endpoint, percent_encode_path(&p)); |
| |
| let mut req = Request::get(&url); |
| |
| // Use "application/vnd.ipld.raw" to disable IPLD codec deserialization |
| // OpenDAL will parse ipld data directly. |
| // |
| // ref: https://github.com/ipfs/specs/blob/main/http-gateways/PATH_GATEWAY.md |
| req = req.header(http::header::ACCEPT, "application/vnd.ipld.raw"); |
| |
| let req = req.body(Buffer::new()).map_err(new_request_build_error)?; |
| |
| self.info.http_client().send(req).await |
| } |
| |
| /// IPFS's stat behavior highly depends on its implementation. |
| /// |
| /// Based on IPFS [Path Gateway Specification](https://github.com/ipfs/specs/blob/main/http-gateways/PATH_GATEWAY.md), |
| /// response payload could be: |
| /// |
| /// > - UnixFS (implicit default) |
| /// > - File |
| /// > - Bytes representing file contents |
| /// > - Directory |
| /// > - Generated HTML with directory index |
| /// > - When `index.html` is present, gateway can skip generating directory index and return it instead |
| /// > - Raw block (not this case) |
| /// > - CAR (not this case) |
| /// |
| /// When we HEAD a given path, we could have the following responses: |
| /// |
| /// - File |
| /// |
| /// ```http |
| /// :) curl -I https://ipfs.io/ipfs/QmPpCt1aYGb9JWJRmXRUnmJtVgeFFTJGzWFYEEX7bo9zGJ/normal_file |
| /// HTTP/1.1 200 Connection established |
| /// |
| /// HTTP/2 200 |
| /// server: openresty |
| /// date: Thu, 08 Sep 2022 00:48:50 GMT |
| /// content-type: application/octet-stream |
| /// content-length: 262144 |
| /// access-control-allow-methods: GET |
| /// cache-control: public, max-age=29030400, immutable |
| /// etag: "QmdP6teFTLSNVhT4W5jkhEuUBsjQ3xkp1GmRvDU6937Me1" |
| /// x-ipfs-gateway-host: ipfs-bank11-fr2 |
| /// x-ipfs-path: /ipfs/QmPpCt1aYGb9JWJRmXRUnmJtVgeFFTJGzWFYEEX7bo9zGJ/normal_file |
| /// x-ipfs-roots: QmPpCt1aYGb9JWJRmXRUnmJtVgeFFTJGzWFYEEX7bo9zGJ,QmdP6teFTLSNVhT4W5jkhEuUBsjQ3xkp1GmRvDU6937Me1 |
| /// x-ipfs-pop: ipfs-bank11-fr2 |
| /// timing-allow-origin: * |
| /// x-ipfs-datasize: 262144 |
| /// access-control-allow-origin: * |
| /// access-control-allow-methods: GET, POST, OPTIONS |
| /// access-control-allow-headers: X-Requested-With, Range, Content-Range, X-Chunked-Output, X-Stream-Output |
| /// access-control-expose-headers: Content-Range, X-Chunked-Output, X-Stream-Output |
| /// x-ipfs-lb-pop: gateway-bank1-fr2 |
| /// strict-transport-security: max-age=31536000; includeSubDomains; preload |
| /// x-proxy-cache: MISS |
| /// accept-ranges: bytes |
| /// ``` |
| /// |
| /// - Dir with generated index |
| /// |
| /// ```http |
| /// :( curl -I https://ipfs.io/ipfs/QmPpCt1aYGb9JWJRmXRUnmJtVgeFFTJGzWFYEEX7bo9zGJ/normal_dir |
| /// HTTP/1.1 200 Connection established |
| /// |
| /// HTTP/2 200 |
| /// server: openresty |
| /// date: Wed, 07 Sep 2022 08:46:13 GMT |
| /// content-type: text/html |
| /// vary: Accept-Encoding |
| /// access-control-allow-methods: GET |
| /// etag: "DirIndex-2b567f6r5vvdg_CID-QmY44DyCDymRN1Qy7sGbupz1ysMkXTWomAQku5vBg7fRQW" |
| /// x-ipfs-gateway-host: ipfs-bank6-sg1 |
| /// x-ipfs-path: /ipfs/QmPpCt1aYGb9JWJRmXRUnmJtVgeFFTJGzWFYEEX7bo9zGJ/normal_dir |
| /// x-ipfs-roots: QmPpCt1aYGb9JWJRmXRUnmJtVgeFFTJGzWFYEEX7bo9zGJ,QmY44DyCDymRN1Qy7sGbupz1ysMkXTWomAQku5vBg7fRQW |
| /// x-ipfs-pop: ipfs-bank6-sg1 |
| /// timing-allow-origin: * |
| /// access-control-allow-origin: * |
| /// access-control-allow-methods: GET, POST, OPTIONS |
| /// access-control-allow-headers: X-Requested-With, Range, Content-Range, X-Chunked-Output, X-Stream-Output |
| /// access-control-expose-headers: Content-Range, X-Chunked-Output, X-Stream-Output |
| /// x-ipfs-lb-pop: gateway-bank3-sg1 |
| /// strict-transport-security: max-age=31536000; includeSubDomains; preload |
| /// x-proxy-cache: MISS |
| /// ``` |
| /// |
| /// - Dir with index.html |
| /// |
| /// ```http |
| /// :) curl -I http://127.0.0.1:8080/ipfs/QmVturFGV3z4WsP7cRV8Ci4avCdGWYXk2qBKvtAwFUp5Az |
| /// HTTP/1.1 302 Found |
| /// Access-Control-Allow-Headers: Content-Type |
| /// Access-Control-Allow-Headers: Range |
| /// Access-Control-Allow-Headers: User-Agent |
| /// Access-Control-Allow-Headers: X-Requested-With |
| /// Access-Control-Allow-Methods: GET |
| /// Access-Control-Allow-Origin: * |
| /// Access-Control-Expose-Headers: Content-Length |
| /// Access-Control-Expose-Headers: Content-Range |
| /// Access-Control-Expose-Headers: X-Chunked-Output |
| /// Access-Control-Expose-Headers: X-Ipfs-Path |
| /// Access-Control-Expose-Headers: X-Ipfs-Roots |
| /// Access-Control-Expose-Headers: X-Stream-Output |
| /// Content-Type: text/html; charset=utf-8 |
| /// Location: /ipfs/QmVturFGV3z4WsP7cRV8Ci4avCdGWYXk2qBKvtAwFUp5Az/ |
| /// X-Ipfs-Path: /ipfs/QmVturFGV3z4WsP7cRV8Ci4avCdGWYXk2qBKvtAwFUp5Az |
| /// X-Ipfs-Roots: QmVturFGV3z4WsP7cRV8Ci4avCdGWYXk2qBKvtAwFUp5Az |
| /// Date: Thu, 08 Sep 2022 00:52:29 GMT |
| /// ``` |
| /// |
| /// In conclusion: |
| /// |
| /// - HTTP Status Code == 302 => directory |
| /// - HTTP Status Code == 200 && ETag starts with `"DirIndex` => directory |
| /// - HTTP Status Code == 200 && ETag not starts with `"DirIndex` => file |
| pub async fn ipfs_stat(&self, path: &str) -> Result<Metadata> { |
| // Stat root always returns a DIR. |
| if path == "/" { |
| return Ok(Metadata::new(EntryMode::DIR)); |
| } |
| |
| let resp = self.ipfs_head(path).await?; |
| let status = resp.status(); |
| |
| match status { |
| StatusCode::OK => { |
| let mut m = Metadata::new(EntryMode::Unknown); |
| |
| if let Some(v) = parse_content_length(resp.headers())? { |
| m.set_content_length(v); |
| } |
| |
| if let Some(v) = parse_content_type(resp.headers())? { |
| m.set_content_type(v); |
| } |
| |
| if let Some(v) = parse_etag(resp.headers())? { |
| m.set_etag(v); |
| |
| if v.starts_with("\"DirIndex") { |
| m.set_mode(EntryMode::DIR); |
| } else { |
| m.set_mode(EntryMode::FILE); |
| } |
| } else { |
| // Some service will stream the output of DirIndex. |
| // If we don't have an etag, it's highly to be a dir. |
| m.set_mode(EntryMode::DIR); |
| } |
| |
| if let Some(v) = parse_content_disposition(resp.headers())? { |
| m.set_content_disposition(v); |
| } |
| |
| Ok(m) |
| } |
| StatusCode::FOUND | StatusCode::MOVED_PERMANENTLY => Ok(Metadata::new(EntryMode::DIR)), |
| _ => Err(parse_error(resp)), |
| } |
| } |
| } |