2014-12-26 22:40:10 -05:00
|
|
|
// Copyright © 2013-14 Steve Francia <spf@spf13.com>.
|
|
|
|
//
|
2015-11-23 22:16:36 -05:00
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
2014-12-26 22:40:10 -05:00
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
2015-11-23 22:16:36 -05:00
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
2014-12-26 22:40:10 -05:00
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
|
|
|
package tpl
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bytes"
|
|
|
|
"encoding/csv"
|
|
|
|
"encoding/json"
|
|
|
|
"errors"
|
|
|
|
"io/ioutil"
|
|
|
|
"net/http"
|
|
|
|
"net/url"
|
2015-06-26 06:23:37 -04:00
|
|
|
"os"
|
|
|
|
"path/filepath"
|
2014-12-26 22:40:10 -05:00
|
|
|
"strings"
|
|
|
|
"sync"
|
2015-05-28 01:36:06 -04:00
|
|
|
"time"
|
2014-12-26 22:40:10 -05:00
|
|
|
|
|
|
|
"github.com/spf13/afero"
|
|
|
|
"github.com/spf13/hugo/helpers"
|
|
|
|
"github.com/spf13/hugo/hugofs"
|
|
|
|
jww "github.com/spf13/jwalterweatherman"
|
|
|
|
"github.com/spf13/viper"
|
|
|
|
)
|
|
|
|
|
2015-05-28 01:36:06 -04:00
|
|
|
var (
|
|
|
|
remoteURLLock = &remoteLock{m: make(map[string]*sync.Mutex)}
|
|
|
|
resSleep = time.Second * 2 // if JSON decoding failed sleep for n seconds before retrying
|
|
|
|
resRetries = 1 // number of retries to load the JSON from URL or local file system
|
|
|
|
)
|
2014-12-26 22:40:10 -05:00
|
|
|
|
|
|
|
// remoteLock hands out one mutex per URL, so that work on the same URL is
// serialized while work on different URLs can proceed independently.
// The embedded RWMutex guards the map m; the mutexes stored in m guard the
// individual URLs.
type remoteLock struct {
	sync.RWMutex
	m map[string]*sync.Mutex
}

// URLLock locks an URL during download. It blocks until every earlier holder
// of the same URL has called URLUnlock.
func (l *remoteLock) URLLock(url string) {
	l.Lock()
	if l.m == nil {
		// Make the zero value usable: writing to a nil map would panic.
		l.m = make(map[string]*sync.Mutex)
	}
	um, ok := l.m[url]
	if !ok {
		um = &sync.Mutex{}
		l.m[url] = um
	}
	// The map lock must be released before blocking on the per-URL mutex, and
	// therefore cannot be deferred: URLUnlock needs the map lock to find the
	// mutex, so holding it while waiting here would deadlock against the
	// goroutine that currently owns the URL.
	l.Unlock()

	// um was fetched while the map lock was held, so the map is not read
	// again without synchronization.
	um.Lock()
}

// URLUnlock unlocks an URL when the download has been finished. Use only in
// defer calls. Unlocking an URL that was never passed to URLLock is a no-op.
func (l *remoteLock) URLUnlock(url string) {
	l.RLock()
	um, ok := l.m[url]
	l.RUnlock()

	if ok {
		um.Unlock()
	}
}
|
|
|
|
|
2015-03-18 01:16:54 -04:00
|
|
|
// getCacheFileID returns the cache ID for a string
|
2014-12-26 22:40:10 -05:00
|
|
|
func getCacheFileID(id string) string {
|
|
|
|
return viper.GetString("CacheDir") + url.QueryEscape(id)
|
|
|
|
}
|
|
|
|
|
|
|
|
// resGetCache returns the content for an ID from the file cache or an error
|
|
|
|
// if the file is not found returns nil,nil
|
2015-02-02 04:14:59 -05:00
|
|
|
func resGetCache(id string, fs afero.Fs, ignoreCache bool) ([]byte, error) {
|
|
|
|
if ignoreCache {
|
|
|
|
return nil, nil
|
|
|
|
}
|
2014-12-26 22:40:10 -05:00
|
|
|
fID := getCacheFileID(id)
|
|
|
|
isExists, err := helpers.Exists(fID, fs)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if !isExists {
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
f, err := fs.Open(fID)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return ioutil.ReadAll(f)
|
|
|
|
}
|
|
|
|
|
|
|
|
// resWriteCache writes bytes to an ID into the file cache
|
|
|
|
func resWriteCache(id string, c []byte, fs afero.Fs) error {
|
|
|
|
fID := getCacheFileID(id)
|
|
|
|
f, err := fs.Create(fID)
|
|
|
|
if err != nil {
|
2015-05-28 01:36:06 -04:00
|
|
|
return errors.New("Error: " + err.Error() + ". Failed to create file: " + fID)
|
2014-12-26 22:40:10 -05:00
|
|
|
}
|
2015-05-28 01:36:06 -04:00
|
|
|
defer f.Close()
|
2014-12-26 22:40:10 -05:00
|
|
|
n, err := f.Write(c)
|
|
|
|
if n == 0 {
|
|
|
|
return errors.New("No bytes written to file: " + fID)
|
|
|
|
}
|
2015-05-28 01:36:06 -04:00
|
|
|
if err != nil {
|
|
|
|
return errors.New("Error: " + err.Error() + ". Failed to write to file: " + fID)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func resDeleteCache(id string, fs afero.Fs) error {
|
|
|
|
return fs.Remove(getCacheFileID(id))
|
2014-12-26 22:40:10 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
// resGetRemote loads the content of a remote file. This method is thread safe.
|
|
|
|
func resGetRemote(url string, fs afero.Fs, hc *http.Client) ([]byte, error) {
|
|
|
|
|
2015-02-02 04:14:59 -05:00
|
|
|
c, err := resGetCache(url, fs, viper.GetBool("IgnoreCache"))
|
2014-12-26 22:40:10 -05:00
|
|
|
if c != nil && err == nil {
|
|
|
|
return c, nil
|
|
|
|
}
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// avoid race condition with locks, block other goroutines if the current url is processing
|
2015-03-11 13:34:57 -04:00
|
|
|
remoteURLLock.URLLock(url)
|
|
|
|
defer func() { remoteURLLock.URLUnlock(url) }()
|
2014-12-26 22:40:10 -05:00
|
|
|
|
|
|
|
// avoid multiple locks due to calling resGetCache twice
|
2015-02-02 04:14:59 -05:00
|
|
|
c, err = resGetCache(url, fs, viper.GetBool("IgnoreCache"))
|
2014-12-26 22:40:10 -05:00
|
|
|
if c != nil && err == nil {
|
|
|
|
return c, nil
|
|
|
|
}
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
jww.INFO.Printf("Downloading: %s ...", url)
|
|
|
|
res, err := hc.Get(url)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
c, err = ioutil.ReadAll(res.Body)
|
|
|
|
res.Body.Close()
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
err = resWriteCache(url, c, fs)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
jww.INFO.Printf("... and cached to: %s", getCacheFileID(url))
|
|
|
|
return c, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// resGetLocal loads the content of a local file
|
|
|
|
func resGetLocal(url string, fs afero.Fs) ([]byte, error) {
|
|
|
|
p := ""
|
|
|
|
if viper.GetString("WorkingDir") != "" {
|
|
|
|
p = viper.GetString("WorkingDir")
|
|
|
|
if helpers.FilePathSeparator != p[len(p)-1:] {
|
|
|
|
p = p + helpers.FilePathSeparator
|
|
|
|
}
|
|
|
|
}
|
|
|
|
jFile := p + url
|
|
|
|
if e, err := helpers.Exists(jFile, fs); !e {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
f, err := fs.Open(jFile)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return ioutil.ReadAll(f)
|
|
|
|
}
|
|
|
|
|
|
|
|
// resGetResource loads the content of a local or remote file
|
|
|
|
func resGetResource(url string) ([]byte, error) {
|
|
|
|
if url == "" {
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
if strings.Contains(url, "://") {
|
|
|
|
return resGetRemote(url, hugofs.SourceFs, http.DefaultClient)
|
|
|
|
}
|
|
|
|
return resGetLocal(url, hugofs.SourceFs)
|
|
|
|
}
|
|
|
|
|
2015-03-18 01:16:54 -04:00
|
|
|
// GetJSON expects one or n-parts of a URL to a resource which can either be a local or a remote one.
|
2015-02-07 23:33:30 -05:00
|
|
|
// If you provide multiple parts they will be joined together to the final URL.
|
2015-03-18 01:16:54 -04:00
|
|
|
// GetJSON returns nil or parsed JSON to use in a short code.
|
2015-03-11 13:34:57 -04:00
|
|
|
func GetJSON(urlParts ...string) interface{} {
|
2015-05-28 01:36:06 -04:00
|
|
|
var v interface{}
|
2015-02-07 23:33:30 -05:00
|
|
|
url := strings.Join(urlParts, "")
|
2014-12-26 22:40:10 -05:00
|
|
|
|
2015-05-28 01:36:06 -04:00
|
|
|
for i := 0; i <= resRetries; i++ {
|
|
|
|
c, err := resGetResource(url)
|
|
|
|
if err != nil {
|
|
|
|
jww.ERROR.Printf("Failed to get json resource %s with error message %s", url, err)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
err = json.Unmarshal(c, &v)
|
|
|
|
if err != nil {
|
|
|
|
jww.ERROR.Printf("Cannot read json from resource %s with error message %s", url, err)
|
|
|
|
jww.ERROR.Printf("Retry #%d for %s and sleeping for %s", i, url, resSleep)
|
|
|
|
time.Sleep(resSleep)
|
|
|
|
resDeleteCache(url, hugofs.SourceFs)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
break
|
2014-12-26 22:40:10 -05:00
|
|
|
}
|
|
|
|
return v
|
|
|
|
}
|
|
|
|
|
2015-03-18 01:16:54 -04:00
|
|
|
// parseCSV parses bytes of CSV data into a slice slice string or an error.
//
// sep must consist of exactly one character; it may be a multi-byte UTF-8
// character. Every record must have the same number of fields as the first
// one, otherwise an error is returned.
func parseCSV(c []byte, sep string) ([][]string, error) {
	// Count characters rather than bytes so that a single non-ASCII separator
	// is accepted.
	rSep := []rune(sep)
	if len(rSep) != 1 {
		return nil, errors.New("Incorrect length of csv separator: " + sep)
	}

	r := csv.NewReader(bytes.NewReader(c))
	r.Comma = rSep[0]
	// 0 makes the reader take the field count of the first record and require
	// it for all following records.
	r.FieldsPerRecord = 0
	return r.ReadAll()
}
|
|
|
|
|
2015-03-18 01:16:54 -04:00
|
|
|
// GetCSV expects a data separator and one or n-parts of a URL to a resource which
|
2015-02-07 23:33:30 -05:00
|
|
|
// can either be a local or a remote one.
|
|
|
|
// The data separator can be a comma, semi-colon, pipe, etc, but only one character.
|
|
|
|
// If you provide multiple parts for the URL they will be joined together to the final URL.
|
2015-03-18 01:16:54 -04:00
|
|
|
// GetCSV returns nil or a slice slice to use in a short code.
|
2015-03-11 13:34:57 -04:00
|
|
|
func GetCSV(sep string, urlParts ...string) [][]string {
|
2015-05-28 01:36:06 -04:00
|
|
|
var d [][]string
|
2015-02-07 23:33:30 -05:00
|
|
|
url := strings.Join(urlParts, "")
|
2015-05-28 01:36:06 -04:00
|
|
|
|
|
|
|
var clearCacheSleep = func(i int, u string) {
|
|
|
|
jww.ERROR.Printf("Retry #%d for %s and sleeping for %s", i, url, resSleep)
|
|
|
|
time.Sleep(resSleep)
|
|
|
|
resDeleteCache(url, hugofs.SourceFs)
|
2014-12-26 22:40:10 -05:00
|
|
|
}
|
2015-05-28 01:36:06 -04:00
|
|
|
|
|
|
|
for i := 0; i <= resRetries; i++ {
|
|
|
|
c, err := resGetResource(url)
|
|
|
|
|
|
|
|
if err == nil && false == bytes.Contains(c, []byte(sep)) {
|
|
|
|
err = errors.New("Cannot find separator " + sep + " in CSV.")
|
|
|
|
}
|
|
|
|
|
|
|
|
if err != nil {
|
|
|
|
jww.ERROR.Printf("Failed to read csv resource %s with error message %s", url, err)
|
|
|
|
clearCacheSleep(i, url)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
if d, err = parseCSV(c, sep); err != nil {
|
|
|
|
jww.ERROR.Printf("Failed to parse csv file %s with error message %s", url, err)
|
|
|
|
clearCacheSleep(i, url)
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
break
|
2014-12-26 22:40:10 -05:00
|
|
|
}
|
|
|
|
return d
|
|
|
|
}
|
2015-06-26 06:23:37 -04:00
|
|
|
|
|
|
|
func ReadDir(path string) []os.FileInfo {
|
2015-08-06 16:46:01 -04:00
|
|
|
wd := ""
|
|
|
|
p := ""
|
2015-06-26 06:23:37 -04:00
|
|
|
if viper.GetString("WorkingDir") != "" {
|
|
|
|
wd = viper.GetString("WorkingDir")
|
|
|
|
}
|
2015-08-06 16:46:01 -04:00
|
|
|
if strings.Contains(path, "..") {
|
|
|
|
jww.ERROR.Printf("Path %s contains parent directory marker", path)
|
2015-06-26 06:23:37 -04:00
|
|
|
return nil
|
2015-08-06 16:46:01 -04:00
|
|
|
}
|
2015-06-26 06:23:37 -04:00
|
|
|
|
|
|
|
p = filepath.Clean(path)
|
|
|
|
p = filepath.Join(wd, p)
|
|
|
|
|
|
|
|
list, err := ioutil.ReadDir(p)
|
|
|
|
if err != nil {
|
|
|
|
jww.ERROR.Printf("Failed to read Directory %s with error message %s", path, err)
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
return list
|
|
|
|
}
|