// Copyright 2021 The Hugo Authors. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
|
|
|
|
|
|
|
|
package create
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bufio"
|
|
|
|
"bytes"
|
2022-05-02 10:07:52 -04:00
|
|
|
"fmt"
|
2021-12-16 05:09:21 -05:00
|
|
|
"io"
|
|
|
|
"mime"
|
|
|
|
"net/http"
|
|
|
|
"net/http/httputil"
|
|
|
|
"net/url"
|
|
|
|
"path"
|
|
|
|
"path/filepath"
|
|
|
|
"strings"
|
|
|
|
|
|
|
|
"github.com/gohugoio/hugo/common/hugio"
|
2022-04-11 04:34:08 -04:00
|
|
|
"github.com/gohugoio/hugo/common/maps"
|
2021-12-16 05:09:21 -05:00
|
|
|
"github.com/gohugoio/hugo/common/types"
|
2023-01-24 14:57:15 -05:00
|
|
|
"github.com/gohugoio/hugo/identity"
|
2021-12-16 09:12:13 -05:00
|
|
|
"github.com/gohugoio/hugo/media"
|
2021-12-16 05:09:21 -05:00
|
|
|
"github.com/gohugoio/hugo/resources"
|
|
|
|
"github.com/gohugoio/hugo/resources/resource"
|
|
|
|
"github.com/mitchellh/mapstructure"
|
|
|
|
)
|
|
|
|
|
2022-03-24 03:12:51 -04:00
|
|
|
// HTTPError is the error type produced when fetching a remote resource fails.
// It embeds the underlying error, so Error() reports that error's message,
// and carries details about the HTTP response when one was received.
type HTTPError struct {
	error

	// Data holds metadata about the HTTP response. It is an empty, non-nil
	// map when the error was created without a response.
	Data map[string]any

	// StatusCode is the HTTP status code of the response, when known.
	StatusCode int

	// Body is the response body as a string, when it was read.
	Body string
}

// Unwrap returns the embedded error so that errors.Is and errors.As can see
// through an HTTPError to the error that caused it.
func (e *HTTPError) Unwrap() error {
	if e == nil {
		return nil
	}
	return e.error
}
|
|
|
|
|
2023-01-16 05:05:28 -05:00
|
|
|
// responseToData collects metadata about res into a map with the keys
// "StatusCode", "Status", "TransferEncoding", "ContentLength" and
// "ContentType".
//
// When readBody is true, the response body is consumed and stored as a
// string under the "Body" key; otherwise the body is left untouched and the
// key is absent.
func responseToData(res *http.Response, readBody bool) map[string]any {
	data := map[string]any{
		"StatusCode":       res.StatusCode,
		"Status":           res.Status,
		"TransferEncoding": res.TransferEncoding,
		"ContentLength":    res.ContentLength,
		"ContentType":      res.Header.Get("Content-Type"),
	}

	if !readBody {
		return data
	}

	var body []byte
	// Guard against a response without a body; io.ReadAll would panic on a
	// nil reader.
	if res.Body != nil {
		// Best effort: a read error is deliberately ignored and whatever
		// was read before the failure is kept.
		body, _ = io.ReadAll(res.Body)
	}
	data["Body"] = string(body)

	return data
}
|
|
|
|
|
|
|
|
func toHTTPError(err error, res *http.Response, readBody bool) *HTTPError {
|
2022-03-24 03:12:51 -04:00
|
|
|
if err == nil {
|
|
|
|
panic("err is nil")
|
|
|
|
}
|
|
|
|
if res == nil {
|
|
|
|
return &HTTPError{
|
|
|
|
error: err,
|
|
|
|
Data: map[string]any{},
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return &HTTPError{
|
|
|
|
error: err,
|
2023-01-16 05:05:28 -05:00
|
|
|
Data: responseToData(res, readBody),
|
2022-03-24 03:12:51 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-12-16 05:09:21 -05:00
|
|
|
// FromRemote expects one or n-parts of a URL to a resource
|
|
|
|
// If you provide multiple parts they will be joined together to the final URL.
|
2022-03-17 17:03:27 -04:00
|
|
|
func (c *Client) FromRemote(uri string, optionsm map[string]any) (resource.Resource, error) {
|
2021-12-16 05:09:21 -05:00
|
|
|
rURL, err := url.Parse(uri)
|
|
|
|
if err != nil {
|
2022-05-02 10:07:52 -04:00
|
|
|
return nil, fmt.Errorf("failed to parse URL for resource %s: %w", uri, err)
|
2021-12-16 05:09:21 -05:00
|
|
|
}
|
|
|
|
|
2023-01-16 05:05:28 -05:00
|
|
|
method := "GET"
|
|
|
|
if s, ok := maps.LookupEqualFold(optionsm, "method"); ok {
|
|
|
|
method = strings.ToUpper(s.(string))
|
|
|
|
}
|
|
|
|
isHeadMethod := method == "HEAD"
|
|
|
|
|
2022-04-11 04:34:08 -04:00
|
|
|
resourceID := calculateResourceID(uri, optionsm)
|
2021-12-16 05:09:21 -05:00
|
|
|
|
|
|
|
_, httpResponse, err := c.cacheGetResource.GetOrCreate(resourceID, func() (io.ReadCloser, error) {
|
|
|
|
options, err := decodeRemoteOptions(optionsm)
|
|
|
|
if err != nil {
|
2022-05-02 10:07:52 -04:00
|
|
|
return nil, fmt.Errorf("failed to decode options for resource %s: %w", uri, err)
|
2021-12-16 05:09:21 -05:00
|
|
|
}
|
|
|
|
if err := c.validateFromRemoteArgs(uri, options); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2023-01-16 05:00:55 -05:00
|
|
|
req, err := options.NewRequest(uri)
|
2021-12-16 05:09:21 -05:00
|
|
|
if err != nil {
|
2022-05-02 10:07:52 -04:00
|
|
|
return nil, fmt.Errorf("failed to create request for resource %s: %w", uri, err)
|
2021-12-16 05:09:21 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
res, err := c.httpClient.Do(req)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2023-01-16 05:05:28 -05:00
|
|
|
defer res.Body.Close()
|
2021-12-16 05:09:21 -05:00
|
|
|
|
2022-03-24 03:12:51 -04:00
|
|
|
httpResponse, err := httputil.DumpResponse(res, true)
|
|
|
|
if err != nil {
|
2023-01-16 05:05:28 -05:00
|
|
|
return nil, toHTTPError(err, res, !isHeadMethod)
|
2022-03-24 03:12:51 -04:00
|
|
|
}
|
|
|
|
|
2021-12-16 05:09:21 -05:00
|
|
|
if res.StatusCode != http.StatusNotFound {
|
|
|
|
if res.StatusCode < 200 || res.StatusCode > 299 {
|
2023-01-16 05:05:28 -05:00
|
|
|
return nil, toHTTPError(fmt.Errorf("failed to fetch remote resource: %s", http.StatusText(res.StatusCode)), res, !isHeadMethod)
|
2021-12-16 05:09:21 -05:00
|
|
|
|
2022-03-24 03:12:51 -04:00
|
|
|
}
|
2021-12-16 05:09:21 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
return hugio.ToReadCloser(bytes.NewReader(httpResponse)), nil
|
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
defer httpResponse.Close()
|
|
|
|
|
|
|
|
res, err := http.ReadResponse(bufio.NewReader(httpResponse), nil)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2023-01-16 05:05:28 -05:00
|
|
|
defer res.Body.Close()
|
2021-12-16 05:09:21 -05:00
|
|
|
|
|
|
|
if res.StatusCode == http.StatusNotFound {
|
|
|
|
// Not found. This matches how looksup for local resources work.
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
|
2023-01-16 05:05:28 -05:00
|
|
|
var (
|
|
|
|
body []byte
|
|
|
|
mediaType media.Type
|
|
|
|
)
|
|
|
|
// A response to a HEAD method should not have a body. If it has one anyway, that body must be ignored.
|
|
|
|
// See https://developer.mozilla.org/en-US/docs/Web/HTTP/Methods/HEAD
|
|
|
|
if !isHeadMethod && res.Body != nil {
|
2023-02-18 17:43:26 -05:00
|
|
|
body, err = io.ReadAll(res.Body)
|
2023-01-16 05:05:28 -05:00
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("failed to read remote resource %q: %w", uri, err)
|
|
|
|
}
|
2021-12-16 05:09:21 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
filename := path.Base(rURL.Path)
|
|
|
|
if _, params, _ := mime.ParseMediaType(res.Header.Get("Content-Disposition")); params != nil {
|
|
|
|
if _, ok := params["filename"]; ok {
|
|
|
|
filename = params["filename"]
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-12-21 04:35:33 -05:00
|
|
|
contentType := res.Header.Get("Content-Type")
|
|
|
|
|
2023-05-20 11:37:04 -04:00
|
|
|
// For HEAD requests we have no body to work with, so we need to use the Content-Type header.
|
|
|
|
if isHeadMethod || c.rs.ExecHelper.Sec().HTTP.MediaTypes.Accept(contentType) {
|
|
|
|
var found bool
|
|
|
|
mediaType, found = c.rs.MediaTypes().GetByType(contentType)
|
|
|
|
if !found {
|
|
|
|
// A media type not configured in Hugo, just create one from the content type string.
|
|
|
|
mediaType, _ = media.FromString(contentType)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if mediaType.IsZero() {
|
2023-01-16 05:05:28 -05:00
|
|
|
|
|
|
|
var extensionHints []string
|
|
|
|
|
|
|
|
// mime.ExtensionsByType gives a long list of extensions for text/plain,
|
|
|
|
// just use ".txt".
|
|
|
|
if strings.HasPrefix(contentType, "text/plain") {
|
|
|
|
extensionHints = []string{".txt"}
|
|
|
|
} else {
|
|
|
|
exts, _ := mime.ExtensionsByType(contentType)
|
|
|
|
if exts != nil {
|
|
|
|
extensionHints = exts
|
|
|
|
}
|
2021-12-21 04:35:33 -05:00
|
|
|
}
|
2021-12-16 05:09:21 -05:00
|
|
|
|
2023-01-16 05:05:28 -05:00
|
|
|
// Look for a file extension. If it's .txt, look for a more specific.
|
|
|
|
if extensionHints == nil || extensionHints[0] == ".txt" {
|
|
|
|
if ext := path.Ext(filename); ext != "" {
|
|
|
|
extensionHints = []string{ext}
|
|
|
|
}
|
2021-12-16 05:09:21 -05:00
|
|
|
}
|
2023-01-16 05:05:28 -05:00
|
|
|
|
|
|
|
// Now resolve the media type primarily using the content.
|
2023-01-04 12:24:36 -05:00
|
|
|
mediaType = media.FromContent(c.rs.MediaTypes(), extensionHints, body)
|
2023-01-16 05:05:28 -05:00
|
|
|
|
2021-12-16 05:09:21 -05:00
|
|
|
}
|
|
|
|
|
2021-12-16 09:12:13 -05:00
|
|
|
if mediaType.IsZero() {
|
2022-05-02 10:07:52 -04:00
|
|
|
return nil, fmt.Errorf("failed to resolve media type for remote resource %q", uri)
|
2021-12-16 05:09:21 -05:00
|
|
|
}
|
|
|
|
|
2021-12-16 09:12:13 -05:00
|
|
|
resourceID = filename[:len(filename)-len(path.Ext(filename))] + "_" + resourceID + mediaType.FirstSuffix.FullSuffix
|
2023-01-16 06:44:39 -05:00
|
|
|
data := responseToData(res, false)
|
2021-12-16 05:09:21 -05:00
|
|
|
|
|
|
|
return c.rs.New(
|
|
|
|
resources.ResourceSourceDescriptor{
|
2021-12-16 09:12:13 -05:00
|
|
|
MediaType: mediaType,
|
2023-01-16 06:44:39 -05:00
|
|
|
Data: data,
|
2021-12-16 05:09:21 -05:00
|
|
|
LazyPublish: true,
|
|
|
|
OpenReadSeekCloser: func() (hugio.ReadSeekCloser, error) {
|
|
|
|
return hugio.NewReadSeekerNoOpCloser(bytes.NewReader(body)), nil
|
|
|
|
},
|
|
|
|
RelTargetFilename: filepath.Clean(resourceID),
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *Client) validateFromRemoteArgs(uri string, options fromRemoteOptions) error {
|
|
|
|
if err := c.rs.ExecHelper.Sec().CheckAllowedHTTPURL(uri); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := c.rs.ExecHelper.Sec().CheckAllowedHTTPMethod(options.Method); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2022-04-11 04:34:08 -04:00
|
|
|
func calculateResourceID(uri string, optionsm map[string]any) string {
|
|
|
|
if key, found := maps.LookupEqualFold(optionsm, "key"); found {
|
2023-01-24 14:57:15 -05:00
|
|
|
return identity.HashString(key)
|
2022-04-11 04:34:08 -04:00
|
|
|
}
|
2023-01-24 14:57:15 -05:00
|
|
|
return identity.HashString(uri, optionsm)
|
2022-04-11 04:34:08 -04:00
|
|
|
}
|
|
|
|
|
2023-01-16 05:00:55 -05:00
|
|
|
// addDefaultHeaders adds Hugo's default request headers to req, leaving any
// header that is already present untouched. Currently that is only the
// User-Agent header.
func addDefaultHeaders(req *http.Request) {
	const userAgentKey = "User-Agent"

	// Direct map lookup; the key above is already in canonical form.
	if _, present := req.Header[userAgentKey]; present {
		return
	}
	req.Header.Add(userAgentKey, "Hugo Static Site Generator")
}
|
|
|
|
|
2022-03-17 17:03:27 -04:00
|
|
|
func addUserProvidedHeaders(headers map[string]any, req *http.Request) {
|
2021-12-16 05:09:21 -05:00
|
|
|
if headers == nil {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
for key, val := range headers {
|
|
|
|
vals := types.ToStringSlicePreserveString(val)
|
|
|
|
for _, s := range vals {
|
|
|
|
req.Header.Add(key, s)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// hasHeaderValue reports whether the header stored in m under key contains
// value. Both the key lookup and the value comparison are exact matches.
func hasHeaderValue(m http.Header, key, value string) bool {
	// A missing key yields a nil slice, which the loop simply skips.
	for _, candidate := range m[key] {
		if candidate == value {
			return true
		}
	}
	return false
}
|
|
|
|
|
|
|
|
// hasHeaderKey reports whether m has an entry for key. The lookup is a plain
// map access, so key must match the stored key exactly.
func hasHeaderKey(m http.Header, key string) bool {
	if _, present := m[key]; present {
		return true
	}
	return false
}
|
|
|
|
|
|
|
|
// fromRemoteOptions holds the options used to build the HTTP request for a
// remote resource.
type fromRemoteOptions struct {
	// Method is the HTTP method of the request.
	Method string

	// Headers are the user-provided request headers, keyed by header name.
	Headers map[string]any

	// Body is the request body; nil means the request has no body.
	Body []byte
}

// BodyReader returns a reader over o.Body, or nil if no body is set.
func (o fromRemoteOptions) BodyReader() io.Reader {
	if o.Body != nil {
		return bytes.NewBuffer(o.Body)
	}
	// Return an untyped nil so that callers comparing against nil see "no body".
	return nil
}
|
|
|
|
|
2023-01-16 05:00:55 -05:00
|
|
|
func (o fromRemoteOptions) NewRequest(url string) (*http.Request, error) {
|
|
|
|
req, err := http.NewRequest(o.Method, url, o.BodyReader())
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// First add any user provided headers.
|
|
|
|
if o.Headers != nil {
|
|
|
|
addUserProvidedHeaders(o.Headers, req)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Then add default headers not provided by the user.
|
|
|
|
addDefaultHeaders(req)
|
|
|
|
|
|
|
|
return req, nil
|
|
|
|
}
|
|
|
|
|
2022-03-17 17:03:27 -04:00
|
|
|
func decodeRemoteOptions(optionsm map[string]any) (fromRemoteOptions, error) {
|
2021-12-21 04:35:33 -05:00
|
|
|
options := fromRemoteOptions{
|
2021-12-16 05:09:21 -05:00
|
|
|
Method: "GET",
|
|
|
|
}
|
|
|
|
|
|
|
|
err := mapstructure.WeakDecode(optionsm, &options)
|
|
|
|
if err != nil {
|
|
|
|
return options, err
|
|
|
|
}
|
|
|
|
options.Method = strings.ToUpper(options.Method)
|
|
|
|
|
|
|
|
return options, nil
|
|
|
|
}
|