// Copyright 2015 The Hugo Authors. All rights reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. package helpers import ( "errors" "fmt" "io" "os" "path/filepath" "regexp" "strings" "unicode" "github.com/spf13/afero" "golang.org/x/text/transform" "golang.org/x/text/unicode/norm" ) var ( // ErrThemeUndefined is returned when a theme has not be defined by the user. ErrThemeUndefined = errors.New("no theme set") ErrWalkRootTooShort = errors.New("Path too short. Stop walking.") ) // filepathPathBridge is a bridge for common functionality in filepath vs path type filepathPathBridge interface { Base(in string) string Clean(in string) string Dir(in string) string Ext(in string) string Join(elem ...string) string Separator() string } type filepathBridge struct { } func (filepathBridge) Base(in string) string { return filepath.Base(in) } func (filepathBridge) Clean(in string) string { return filepath.Clean(in) } func (filepathBridge) Dir(in string) string { return filepath.Dir(in) } func (filepathBridge) Ext(in string) string { return filepath.Ext(in) } func (filepathBridge) Join(elem ...string) string { return filepath.Join(elem...) } func (filepathBridge) Separator() string { return FilePathSeparator } var fpb filepathBridge // MakePath takes a string with any characters and replace it // so the string could be used in a path. // It does so by creating a Unicode-sanitized string, with the spaces replaced, // whilst preserving the original casing of the string. // E.g. 
Social Media -> Social-Media func (p *PathSpec) MakePath(s string) string { return p.UnicodeSanitize(strings.Replace(strings.TrimSpace(s), " ", "-", -1)) } // MakePathSanitized creates a Unicode-sanitized string, with the spaces replaced func (p *PathSpec) MakePathSanitized(s string) string { if p.disablePathToLower { return p.MakePath(s) } return strings.ToLower(p.MakePath(s)) } // MakeTitle converts the path given to a suitable title, trimming whitespace // and replacing hyphens with whitespace. func MakeTitle(inpath string) string { return strings.Replace(strings.TrimSpace(inpath), "-", " ", -1) } // From https://golang.org/src/net/url/url.go func ishex(c rune) bool { switch { case '0' <= c && c <= '9': return true case 'a' <= c && c <= 'f': return true case 'A' <= c && c <= 'F': return true } return false } // UnicodeSanitize sanitizes string to be used in Hugo URL's, allowing only // a predefined set of special Unicode characters. // If RemovePathAccents configuration flag is enabled, Uniccode accents // are also removed. func (p *PathSpec) UnicodeSanitize(s string) string { source := []rune(s) target := make([]rune, 0, len(source)) for i, r := range source { if r == '%' && i+2 < len(source) && ishex(source[i+1]) && ishex(source[i+2]) { target = append(target, r) } else if unicode.IsLetter(r) || unicode.IsDigit(r) || unicode.IsMark(r) || r == '.' || r == '/' || r == '\\' || r == '_' || r == '-' || r == '#' || r == '+' || r == '~' { target = append(target, r) } } var result string if p.removePathAccents { // remove accents - see https://blog.golang.org/normalization t := transform.Chain(norm.NFD, transform.RemoveFunc(isMn), norm.NFC) result, _, _ = transform.String(t, string(target)) } else { result = string(target) } return result } func isMn(r rune) bool { return unicode.Is(unicode.Mn, r) // Mn: nonspacing marks } // ReplaceExtension takes a path and an extension, strips the old extension // and returns the path with the new extension. 
func ReplaceExtension(path string, newExt string) string { f, _ := fileAndExt(path, fpb) return f + "." + newExt } // AbsPathify creates an absolute path if given a relative path. If already // absolute, the path is just cleaned. func (p *PathSpec) AbsPathify(inPath string) string { if filepath.IsAbs(inPath) { return filepath.Clean(inPath) } // TODO(bep): Consider moving workingDir to argument list return filepath.Clean(filepath.Join(p.workingDir, inPath)) } // GetLayoutDirPath returns the absolute path to the layout file dir // for the current Hugo project. func (p *PathSpec) GetLayoutDirPath() string { return p.AbsPathify(p.layoutDir) } // GetStaticDirPath returns the absolute path to the static file dir // for the current Hugo project. func (p *PathSpec) GetStaticDirPath() string { return p.AbsPathify(p.staticDir) } // GetThemeDir gets the root directory of the current theme, if there is one. // If there is no theme, returns the empty string. func (p *PathSpec) GetThemeDir() string { if p.ThemeSet() { return p.AbsPathify(filepath.Join(p.themesDir, p.theme)) } return "" } // GetRelativeThemeDir gets the relative root directory of the current theme, if there is one. // If there is no theme, returns the empty string. func (p *PathSpec) GetRelativeThemeDir() string { if p.ThemeSet() { return strings.TrimPrefix(filepath.Join(p.themesDir, p.theme), FilePathSeparator) } return "" } // GetThemeStaticDirPath returns the theme's static dir path if theme is set. // If theme is set and the static dir doesn't exist, an error is returned. func (p *PathSpec) GetThemeStaticDirPath() (string, error) { return p.getThemeDirPath("static") } // GetThemeDataDirPath returns the theme's data dir path if theme is set. // If theme is set and the data dir doesn't exist, an error is returned. func (p *PathSpec) GetThemeDataDirPath() (string, error) { return p.getThemeDirPath("data") } // GetThemeI18nDirPath returns the theme's i18n dir path if theme is set. 
// If theme is set and the i18n dir doesn't exist, an error is returned. func (p *PathSpec) GetThemeI18nDirPath() (string, error) { return p.getThemeDirPath("i18n") } func (p *PathSpec) getThemeDirPath(path string) (string, error) { if !p.ThemeSet() { return "", ErrThemeUndefined } themeDir := filepath.Join(p.GetThemeDir(), path) if _, err := p.fs.Source.Stat(themeDir); os.IsNotExist(err) { return "", fmt.Errorf("Unable to find %s directory for theme %s in %s", path, p.theme, themeDir) } return themeDir, nil } // GetThemesDirPath gets the static files directory of the current theme, if there is one. // Ignores underlying errors. // TODO(bep) Candidate for deprecation? func (p *PathSpec) GetThemesDirPath() string { dir, _ := p.getThemeDirPath("static") return dir } // MakeStaticPathRelative makes a relative path to the static files directory. // It does so by taking either the project's static path or the theme's static // path into consideration. func (p *PathSpec) MakeStaticPathRelative(inPath string) (string, error) { staticDir := p.GetStaticDirPath() themeStaticDir := p.GetThemesDirPath() return makePathRelative(inPath, staticDir, themeStaticDir) } func makePathRelative(inPath string, possibleDirectories ...string) (string, error) { for _, currentPath := range possibleDirectories { if strings.HasPrefix(inPath, currentPath) { return strings.TrimPrefix(inPath, currentPath), nil } } return inPath, errors.New("Can't extract relative path, unknown prefix") } // Should be good enough for Hugo. var isFileRe = regexp.MustCompile(`.*\..{1,6}$`) // GetDottedRelativePath expects a relative path starting after the content directory. // It returns a relative path with dots ("..") navigating up the path structure. func GetDottedRelativePath(inPath string) string { inPath = filepath.Clean(filepath.FromSlash(inPath)) if inPath == "." 
{ return "./" } if !isFileRe.MatchString(inPath) && !strings.HasSuffix(inPath, FilePathSeparator) { inPath += FilePathSeparator } if !strings.HasPrefix(inPath, FilePathSeparator) { inPath = FilePathSeparator + inPath } dir, _ := filepath.Split(inPath) sectionCount := strings.Count(dir, FilePathSeparator) if sectionCount == 0 || dir == FilePathSeparator { return "./" } var dottedPath string for i := 1; i < sectionCount; i++ { dottedPath += "../" } return dottedPath } // Filename takes a path, strips out the extension, // and returns the name of the file. func Filename(in string) (name string) { name, _ = fileAndExt(in, fpb) return } // FileAndExt returns the filename and any extension of a file path as // two separate strings. // // If the path, in, contains a directory name ending in a slash, // then both name and ext will be empty strings. // // If the path, in, is either the current directory, the parent // directory or the root directory, or an empty string, // then both name and ext will be empty strings. // // If the path, in, represents the path of a file without an extension, // then name will be the name of the file and ext will be an empty string. // // If the path, in, represents a filename with an extension, // then name will be the filename minus any extension - including the dot // and ext will contain the extension - minus the dot. func fileAndExt(in string, b filepathPathBridge) (name string, ext string) { ext = b.Ext(in) base := b.Base(in) return extractFilename(in, ext, base, b.Separator()), ext } func extractFilename(in, ext, base, pathSeparator string) (name string) { // No file name cases. These are defined as: // 1. any "in" path that ends in a pathSeparator // 2. any "base" consisting of just an pathSeparator // 3. any "base" consisting of just an empty string // 4. any "base" consisting of just the current directory i.e. "." // 5. any "base" consisting of just the parent directory i.e. ".." 
if (strings.LastIndex(in, pathSeparator) == len(in)-1) || base == "" || base == "." || base == ".." || base == pathSeparator { name = "" // there is NO filename } else if ext != "" { // there was an Extension // return the filename minus the extension (and the ".") name = base[:strings.LastIndex(base, ".")] } else { // no extension case so just return base, which willi // be the filename name = base } return } // GetRelativePath returns the relative path of a given path. func GetRelativePath(path, base string) (final string, err error) { if filepath.IsAbs(path) && base == "" { return "", errors.New("source: missing base directory") } name := filepath.Clean(path) base = filepath.Clean(base) name, err = filepath.Rel(base, name) if err != nil { return "", err } if strings.HasSuffix(filepath.FromSlash(path), FilePathSeparator) && !strings.HasSuffix(name, FilePathSeparator) { name += FilePathSeparator } return name, nil } // PaginateAliasPath creates a path used to access the aliases in the paginator. func (p *PathSpec) PaginateAliasPath(base string, page int) string { paginatePath := p.paginatePath uglify := p.uglyURLs var pth string if base != "" { pth = filepath.FromSlash(fmt.Sprintf("/%s/%s/%d", base, paginatePath, page)) } else { pth = filepath.FromSlash(fmt.Sprintf("/%s/%d", paginatePath, page)) } if uglify { pth += ".html" } return pth } // GuessSection returns the section given a source path. // A section is the part between the root slash and the second slash // or before the first slash. func GuessSection(in string) string { parts := strings.Split(in, FilePathSeparator) // This will include an empty entry before and after paths with leading and trailing slashes // eg... 
/sect/one/ -> ["", "sect", "one", ""] // Needs to have at least a value and a slash if len(parts) < 2 { return "" } // If it doesn't have a leading slash and value and file or trailing slash, then return "" if parts[0] == "" && len(parts) < 3 { return "" } // strip leading slash if parts[0] == "" { parts = parts[1:] } // if first directory is "content", return second directory if parts[0] == "content" { if len(parts) > 2 { return parts[1] } return "" } return parts[0] } // PathPrep prepares the path using the uglify setting to create paths on // either the form /section/name/index.html or /section/name.html. func PathPrep(ugly bool, in string) string { if ugly { return Uglify(in) } return PrettifyPath(in) } // PrettifyPath is the same as PrettifyURLPath but for file paths. // /section/name.html becomes /section/name/index.html // /section/name/ becomes /section/name/index.html // /section/name/index.html becomes /section/name/index.html func PrettifyPath(in string) string { return prettifyPath(in, fpb) } func prettifyPath(in string, b filepathPathBridge) string { if filepath.Ext(in) == "" { // /section/name/ -> /section/name/index.html if len(in) < 2 { return b.Separator() } return b.Join(b.Clean(in), "index.html") } name, ext := fileAndExt(in, b) if name == "index" { // /section/name/index.html -> /section/name/index.html return b.Clean(in) } // /section/name.html -> /section/name/index.html return b.Join(b.Dir(in), name, "index"+ext) } // ExtractRootPaths extracts the root paths from the supplied list of paths. // The resulting root path will not contain any file separators, but there // may be duplicates. 
// So "/content/section/" becomes "content" func ExtractRootPaths(paths []string) []string { r := make([]string, len(paths)) for i, p := range paths { root := filepath.ToSlash(p) sections := strings.Split(root, "/") for _, section := range sections { if section != "" { root = section break } } r[i] = root } return r } // FindCWD returns the current working directory from where the Hugo // executable is run. func FindCWD() (string, error) { serverFile, err := filepath.Abs(os.Args[0]) if err != nil { return "", fmt.Errorf("Can't get absolute path for executable: %v", err) } path := filepath.Dir(serverFile) realFile, err := filepath.EvalSymlinks(serverFile) if err != nil { if _, err = os.Stat(serverFile + ".exe"); err == nil { realFile = filepath.Clean(serverFile + ".exe") } } if err == nil && realFile != serverFile { path = filepath.Dir(realFile) } return path, nil } // SymbolicWalk is like filepath.Walk, but it supports the root being a // symbolic link. It will still not follow symbolic links deeper down in // the file structure func SymbolicWalk(fs afero.Fs, root string, walker filepath.WalkFunc) error { // Sanity check if len(root) < 4 { return ErrWalkRootTooShort } // Handle the root first fileInfo, realPath, err := getRealFileInfo(fs, root) if err != nil { return walker(root, nil, err) } if !fileInfo.IsDir() { return fmt.Errorf("Cannot walk regular file %s", root) } if err := walker(realPath, fileInfo, err); err != nil && err != filepath.SkipDir { return err } rootContent, err := afero.ReadDir(fs, root) if err != nil { return walker(root, nil, err) } for _, fi := range rootContent { if err := afero.Walk(fs, filepath.Join(root, fi.Name()), walker); err != nil { return err } } return nil } func getRealFileInfo(fs afero.Fs, path string) (os.FileInfo, string, error) { fileInfo, err := lstatIfOs(fs, path) realPath := path if err != nil { return nil, "", err } if fileInfo.Mode()&os.ModeSymlink == os.ModeSymlink { link, err := filepath.EvalSymlinks(path) if err != nil 
{ return nil, "", fmt.Errorf("Cannot read symbolic link '%s', error was: %s", path, err) } fileInfo, err = lstatIfOs(fs, link) if err != nil { return nil, "", fmt.Errorf("Cannot stat '%s', error was: %s", link, err) } realPath = link } return fileInfo, realPath, nil } // GetRealPath returns the real file path for the given path, whether it is a // symlink or not. func GetRealPath(fs afero.Fs, path string) (string, error) { _, realPath, err := getRealFileInfo(fs, path) if err != nil { return "", err } return realPath, nil } // Code copied from Afero's path.go // if the filesystem is OsFs use Lstat, else use fs.Stat func lstatIfOs(fs afero.Fs, path string) (info os.FileInfo, err error) { _, ok := fs.(*afero.OsFs) if ok { info, err = os.Lstat(path) } else { info, err = fs.Stat(path) } return } // SafeWriteToDisk is the same as WriteToDisk // but it also checks to see if file/directory already exists. func SafeWriteToDisk(inpath string, r io.Reader, fs afero.Fs) (err error) { return afero.SafeWriteReader(fs, inpath, r) } // WriteToDisk writes content to disk. func WriteToDisk(inpath string, r io.Reader, fs afero.Fs) (err error) { return afero.WriteReader(fs, inpath, r) } // GetTempDir returns a temporary directory with the given sub path. func GetTempDir(subPath string, fs afero.Fs) string { return afero.GetTempDir(fs, subPath) } // DirExists checks if a path exists and is a directory. func DirExists(path string, fs afero.Fs) (bool, error) { return afero.DirExists(fs, path) } // IsDir checks if a given path is a directory. func IsDir(path string, fs afero.Fs) (bool, error) { return afero.IsDir(fs, path) } // IsEmpty checks if a given path is empty. func IsEmpty(path string, fs afero.Fs) (bool, error) { return afero.IsEmpty(fs, path) } // FileContains checks if a file contains a specified string. 
// The lookup is delegated to afero.FileContainsBytes on the given filesystem;
// subslice is the byte sequence searched for.
func FileContains(filename string, subslice []byte, fs afero.Fs) (bool, error) {
	return afero.FileContainsBytes(fs, filename, subslice)
}

// FileContainsAny checks if a file contains any of the specified strings.
// The lookup is delegated to afero.FileContainsAnyBytes on the given
// filesystem; subslices are the byte sequences searched for.
func FileContainsAny(filename string, subslices [][]byte, fs afero.Fs) (bool, error) {
	return afero.FileContainsAnyBytes(fs, filename, subslices)
}

// Exists checks if a file or directory exists.
// The check is delegated to afero.Exists on the given filesystem.
func Exists(path string, fs afero.Fs) (bool, error) {
	return afero.Exists(fs, path)
}