// Copyright 2019 The Hugo Authors. All rights reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. package media import ( "encoding/json" "errors" "fmt" "net/http" "sort" "strings" "github.com/spf13/cast" "github.com/gohugoio/hugo/common/maps" "github.com/mitchellh/mapstructure" ) const ( defaultDelimiter = "." ) // Type (also known as MIME type and content type) is a two-part identifier for // file formats and format contents transmitted on the Internet. // For Hugo's use case, we use the top-level type name / subtype name + suffix. // One example would be application/svg+xml // If suffix is not provided, the sub type will be used. // See // https://en.wikipedia.org/wiki/Media_type type Type struct { MainType string `json:"mainType"` // i.e. text SubType string `json:"subType"` // i.e. html Delimiter string `json:"delimiter"` // e.g. "." // FirstSuffix holds the first suffix defined for this Type. FirstSuffix SuffixInfo `json:"firstSuffix"` // This is the optional suffix after the "+" in the MIME type, // e.g. "xml" in "application/rss+xml". mimeSuffix string // E.g. "jpg,jpeg" // Stored as a string to make Type comparable. suffixesCSV string } // SuffixInfo holds information about a Type's suffix. type SuffixInfo struct { Suffix string `json:"suffix"` FullSuffix string `json:"fullSuffix"` } // FromContent resolve the Type primarily using http.DetectContentType. // If http.DetectContentType resolves to application/octet-stream, a zero Type is returned. // If http.DetectContentType resolves to text/plain or application/xml, we try to get more specific using types and ext. func FromContent(types Types, ext string, content []byte) Type { ext = strings.TrimPrefix(ext, ".") t := strings.Split(http.DetectContentType(content), ";")[0] var m Type if t == "application/octet-stream" { return m } var found bool m, found = types.GetByType(t) if !found { if t == "text/xml" { // This is how it's configured in Hugo by default. m, found = types.GetByType("application/xml") } } if !found || ext == "" { return m } if m.Type() == "text/plain" || m.Type() == "application/xml" { // http.DetectContentType isn't brilliant when it comes to common text formats, so we need to do better. // For now we say that if it's detected to be a text format and the extension/content type in header reports // it to be a text format, then we use that. mm, _, found := types.GetFirstBySuffix(ext) if found && mm.IsText() { return mm } } return m } // FromStringAndExt creates a Type from a MIME string and a given extension. func FromStringAndExt(t, ext string) (Type, error) { tp, err := fromString(t) if err != nil { return tp, err } tp.suffixesCSV = strings.TrimPrefix(ext, ".") tp.Delimiter = defaultDelimiter tp.init() return tp, nil } // FromString creates a new Type given a type string on the form MainType/SubType and // an optional suffix, e.g. "text/html" or "text/html+html". func fromString(t string) (Type, error) { t = strings.ToLower(t) parts := strings.Split(t, "/") if len(parts) != 2 { return Type{}, fmt.Errorf("cannot parse %q as a media type", t) } mainType := parts[0] subParts := strings.Split(parts[1], "+") subType := strings.Split(subParts[0], ";")[0] var suffix string if len(subParts) > 1 { suffix = subParts[1] } return Type{MainType: mainType, SubType: subType, mimeSuffix: suffix}, nil } // Type returns a string representing the main- and sub-type of a media type, e.g. "text/css". // A suffix identifier will be appended after a "+" if set, e.g. "image/svg+xml". // Hugo will register a set of default media types. // These can be overridden by the user in the configuration, // by defining a media type with the same Type. func (m Type) Type() string { // Examples are // image/svg+xml // text/css if m.mimeSuffix != "" { return m.MainType + "/" + m.SubType + "+" + m.mimeSuffix } return m.MainType + "/" + m.SubType } func (m Type) String() string { return m.Type() } // Suffixes returns all valid file suffixes for this type. func (m Type) Suffixes() []string { if m.suffixesCSV == "" { return nil } return strings.Split(m.suffixesCSV, ",") } // IsText returns whether this Type is a text format. // Note that this may currently return false negatives. // TODO(bep) improve func (m Type) IsText() bool { if m.MainType == "text" { return true } switch m.SubType { case "javascript", "json", "rss", "xml", "svg", TOMLType.SubType, YAMLType.SubType: return true } return false } func (m *Type) init() { m.FirstSuffix.FullSuffix = "" m.FirstSuffix.Suffix = "" if suffixes := m.Suffixes(); suffixes != nil { m.FirstSuffix.Suffix = suffixes[0] m.FirstSuffix.FullSuffix = m.Delimiter + m.FirstSuffix.Suffix } } // WithDelimiterAndSuffixes is used in tests. func WithDelimiterAndSuffixes(t Type, delimiter, suffixesCSV string) Type { t.Delimiter = delimiter t.suffixesCSV = suffixesCSV t.init() return t } func newMediaType(main, sub string, suffixes []string) Type { t := Type{MainType: main, SubType: sub, suffixesCSV: strings.Join(suffixes, ","), Delimiter: defaultDelimiter} t.init() return t } func newMediaTypeWithMimeSuffix(main, sub, mimeSuffix string, suffixes []string) Type { mt := newMediaType(main, sub, suffixes) mt.mimeSuffix = mimeSuffix mt.init() return mt } // Definitions from https://developer.mozilla.org/en-US/docs/Web/HTTP/Basics_of_HTTP/MIME_types etc. // Note that from Hugo 0.44 we only set Suffix if it is part of the MIME type. var ( CalendarType = newMediaType("text", "calendar", []string{"ics"}) CSSType = newMediaType("text", "css", []string{"css"}) SCSSType = newMediaType("text", "x-scss", []string{"scss"}) SASSType = newMediaType("text", "x-sass", []string{"sass"}) CSVType = newMediaType("text", "csv", []string{"csv"}) HTMLType = newMediaType("text", "html", []string{"html"}) JavascriptType = newMediaType("application", "javascript", []string{"js"}) TypeScriptType = newMediaType("application", "typescript", []string{"ts"}) TSXType = newMediaType("text", "tsx", []string{"tsx"}) JSXType = newMediaType("text", "jsx", []string{"jsx"}) JSONType = newMediaType("application", "json", []string{"json"}) WebAppManifestType = newMediaTypeWithMimeSuffix("application", "manifest", "json", []string{"webmanifest"}) RSSType = newMediaTypeWithMimeSuffix("application", "rss", "xml", []string{"xml", "rss"}) XMLType = newMediaType("application", "xml", []string{"xml"}) SVGType = newMediaTypeWithMimeSuffix("image", "svg", "xml", []string{"svg"}) TextType = newMediaType("text", "plain", []string{"txt"}) TOMLType = newMediaType("application", "toml", []string{"toml"}) YAMLType = newMediaType("application", "yaml", []string{"yaml", "yml"}) // Common image types PNGType = newMediaType("image", "png", []string{"png"}) JPEGType = newMediaType("image", "jpeg", []string{"jpg", "jpeg", "jpe", "jif", "jfif"}) GIFType = newMediaType("image", "gif", []string{"gif"}) TIFFType = newMediaType("image", "tiff", []string{"tif", "tiff"}) BMPType = newMediaType("image", "bmp", []string{"bmp"}) WEBPType = newMediaType("image", "webp", []string{"webp"}) // Common font types TrueTypeFontType = newMediaType("font", "ttf", []string{"ttf"}) OpenTypeFontType = newMediaType("font", "otf", []string{"otf"}) // Common document types PDFType = newMediaType("application", "pdf", []string{"pdf"}) // Common video types AVIType = newMediaType("video", "x-msvideo", []string{"avi"}) MPEGType = newMediaType("video", "mpeg", []string{"mpg", "mpeg"}) MP4Type = newMediaType("video", "mp4", []string{"mp4"}) OGGType = newMediaType("video", "ogg", []string{"ogv"}) WEBMType = newMediaType("video", "webm", []string{"webm"}) GPPType = newMediaType("video", "3gpp", []string{"3gpp", "3gp"}) OctetType = newMediaType("application", "octet-stream", nil) ) // DefaultTypes is the default media types supported by Hugo. var DefaultTypes = Types{ CalendarType, CSSType, CSVType, SCSSType, SASSType, HTMLType, JavascriptType, TypeScriptType, TSXType, JSXType, JSONType, WebAppManifestType, RSSType, XMLType, SVGType, TextType, OctetType, YAMLType, TOMLType, PNGType, JPEGType, WEBPType, AVIType, MPEGType, MP4Type, OGGType, WEBMType, GPPType, OpenTypeFontType, TrueTypeFontType, PDFType, } func init() { sort.Sort(DefaultTypes) } // Types is a slice of media types. type Types []Type func (t Types) Len() int { return len(t) } func (t Types) Swap(i, j int) { t[i], t[j] = t[j], t[i] } func (t Types) Less(i, j int) bool { return t[i].Type() < t[j].Type() } // GetByType returns a media type for tp. func (t Types) GetByType(tp string) (Type, bool) { for _, tt := range t { if strings.EqualFold(tt.Type(), tp) { return tt, true } } if !strings.Contains(tp, "+") { // Try with the main and sub type parts := strings.Split(tp, "/") if len(parts) == 2 { return t.GetByMainSubType(parts[0], parts[1]) } } return Type{}, false } // BySuffix will return all media types matching a suffix. func (t Types) BySuffix(suffix string) []Type { suffix = strings.ToLower(suffix) var types []Type for _, tt := range t { if tt.hasSuffix(suffix) { types = append(types, tt) } } return types } // GetFirstBySuffix will return the first type matching the given suffix. func (t Types) GetFirstBySuffix(suffix string) (Type, SuffixInfo, bool) { suffix = strings.ToLower(suffix) for _, tt := range t { if tt.hasSuffix(suffix) { return tt, SuffixInfo{ FullSuffix: tt.Delimiter + suffix, Suffix: suffix, }, true } } return Type{}, SuffixInfo{}, false } // GetBySuffix gets a media type given as suffix, e.g. "html". // It will return false if no format could be found, or if the suffix given // is ambiguous. // The lookup is case insensitive. func (t Types) GetBySuffix(suffix string) (tp Type, si SuffixInfo, found bool) { suffix = strings.ToLower(suffix) for _, tt := range t { if tt.hasSuffix(suffix) { if found { // ambiguous found = false return } tp = tt si = SuffixInfo{ FullSuffix: tt.Delimiter + suffix, Suffix: suffix, } found = true } } return } func (m Type) hasSuffix(suffix string) bool { return strings.Contains(","+m.suffixesCSV+",", ","+suffix+",") } // GetByMainSubType gets a media type given a main and a sub type e.g. "text" and "plain". // It will return false if no format could be found, or if the combination given // is ambiguous. // The lookup is case insensitive. func (t Types) GetByMainSubType(mainType, subType string) (tp Type, found bool) { for _, tt := range t { if strings.EqualFold(mainType, tt.MainType) && strings.EqualFold(subType, tt.SubType) { if found { // ambiguous found = false return } tp = tt found = true } } return } func suffixIsRemoved() error { return errors.New(`MediaType.Suffix is removed. Before Hugo 0.44 this was used both to set a custom file suffix and as way to augment the mediatype definition (what you see after the "+", e.g. "image/svg+xml"). This had its limitations. For one, it was only possible with one file extension per MIME type. Now you can specify multiple file suffixes using "suffixes", but you need to specify the full MIME type identifier: [mediaTypes] [mediaTypes."image/svg+xml"] suffixes = ["svg", "abc" ] In most cases, it will be enough to just change: [mediaTypes] [mediaTypes."my/custom-mediatype"] suffix = "txt" To: [mediaTypes] [mediaTypes."my/custom-mediatype"] suffixes = ["txt"] Note that you can still get the Media Type's suffix from a template: {{ $mediaType.Suffix }}. But this will now map to the MIME type filename. `) } // DecodeTypes takes a list of media type configurations and merges those, // in the order given, with the Hugo defaults as the last resort. func DecodeTypes(mms ...map[string]interface{}) (Types, error) { var m Types // Maps type string to Type. Type string is the full application/svg+xml. mmm := make(map[string]Type) for _, dt := range DefaultTypes { mmm[dt.Type()] = dt } for _, mm := range mms { for k, v := range mm { var mediaType Type mediaType, found := mmm[k] if !found { var err error mediaType, err = fromString(k) if err != nil { return m, err } } if err := mapstructure.WeakDecode(v, &mediaType); err != nil { return m, err } vm := maps.ToStringMap(v) maps.PrepareParams(vm) _, delimiterSet := vm["delimiter"] _, suffixSet := vm["suffix"] if suffixSet { return Types{}, suffixIsRemoved() } if suffixes, found := vm["suffixes"]; found { mediaType.suffixesCSV = strings.TrimSpace(strings.ToLower(strings.Join(cast.ToStringSlice(suffixes), ","))) } // The user may set the delimiter as an empty string. if !delimiterSet && mediaType.suffixesCSV != "" { mediaType.Delimiter = defaultDelimiter } mediaType.init() mmm[k] = mediaType } } for _, v := range mmm { m = append(m, v) } sort.Sort(m) return m, nil } // IsZero reports whether this Type represents a zero value. func (m Type) IsZero() bool { return m.SubType == "" } // MarshalJSON returns the JSON encoding of m. func (m Type) MarshalJSON() ([]byte, error) { type Alias Type return json.Marshal(&struct { Alias Type string `json:"type"` String string `json:"string"` Suffixes []string `json:"suffixes"` }{ Alias: (Alias)(m), Type: m.Type(), String: m.String(), Suffixes: strings.Split(m.suffixesCSV, ","), }) }