123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563 |
- // The path/filepath package uses either forward slashes or backslashes depending on the operating system
- // To process paths such as URLs that depend on forward slashes regardless of the OS, use the path package
- package filepath
- import "core:strings"
- SEPARATOR_CHARS :: `/\`
- // is_separator checks whether the byte is a valid separator character
- is_separator :: proc(c: byte) -> bool {
- switch c {
- case '/': return true
- case '\\': return ODIN_OS == .Windows
- }
- return false
- }
- @(private)
- is_slash :: proc(c: byte) -> bool {
- return c == '\\' || c == '/'
- }
- // Splits path immediate following the last separator; separating the path into a directory and file.
- // If no separator is found, `dir` will be empty and `path` set to `path`.
- split :: proc(path: string) -> (dir, file: string) {
- vol := volume_name(path)
- i := len(path) - 1
- for i >= len(vol) && !is_separator(path[i]) {
- i -= 1
- }
- return path[:i+1], path[i+1:]
- }
- /*
- Returns leading volume name.
- e.g.
- "C:\foo\bar\baz" will return "C:" on Windows.
- Everything else will be "".
- */
- volume_name :: proc(path: string) -> string {
- return path[:volume_name_len(path)]
- }
- // Returns the length of the volume name in bytes.
- volume_name_len :: proc(path: string) -> int {
- if ODIN_OS == .Windows {
- if len(path) < 2 {
- return 0
- }
- c := path[0]
- if path[1] == ':' {
- switch c {
- case 'a'..='z', 'A'..='Z':
- return 2
- }
- }
- // URL: https://msdn.microsoft.com/en-us/library/windows/desktop/aa365247(v=vs.85).aspx
- if l := len(path); l >= 5 && is_slash(path[0]) && is_slash(path[1]) &&
- !is_slash(path[2]) && path[2] != '.' {
- for n := 3; n < l-1; n += 1 {
- if is_slash(path[n]) {
- n += 1
- if !is_slash(path[n]) {
- if path[n] == '.' {
- break
- }
- }
- for ; n < l; n += 1 {
- if is_slash(path[n]) {
- break
- }
- }
- return n
- }
- break
- }
- }
- }
- return 0
- }
- /*
- Gets the file name and extension from a path.
- e.g.
- 'path/to/name.tar.gz' -> 'name.tar.gz'
- 'path/to/name.txt' -> 'name.txt'
- 'path/to/name' -> 'name'
- Returns "." if the path is an empty string.
- */
- base :: proc(path: string) -> string {
- if path == "" {
- return "."
- }
- path := path
- for len(path) > 0 && is_separator(path[len(path)-1]) {
- path = path[:len(path)-1]
- }
- path = path[volume_name_len(path):]
- i := len(path)-1
- for i >= 0 && !is_separator(path[i]) {
- i -= 1
- }
- if i >= 0 {
- path = path[i+1:]
- }
- if path == "" {
- return SEPARATOR_STRING
- }
- return path
- }
- /*
- Gets the name of a file from a path.
- The stem of a file is such that stem(path) + ext(path) = base(path).
- Only the last dot is considered when splitting the file extension.
- See `short_stem`.
- e.g.
- 'name.tar.gz' -> 'name.tar'
- 'name.txt' -> 'name'
- Returns an empty string if there is no stem. e.g: '.gitignore'.
- Returns an empty string if there's a trailing path separator.
- */
- stem :: proc(path: string) -> string {
- if len(path) > 0 && is_separator(path[len(path) - 1]) {
- // NOTE(tetra): Trailing separator
- return ""
- }
- // NOTE(tetra): Get the basename
- path := path
- if i := strings.last_index_any(path, SEPARATOR_CHARS); i != -1 {
- path = path[i+1:]
- }
- if i := strings.last_index_byte(path, '.'); i != -1 {
- return path[:i]
- }
- return path
- }
- /*
- Gets the name of a file from a path.
- The short stem is such that short_stem(path) + long_ext(path) = base(path).
- The first dot is used to split off the file extension, unlike `stem` which uses the last dot.
- e.g.
- 'name.tar.gz' -> 'name'
- 'name.txt' -> 'name'
- Returns an empty string if there is no stem. e.g: '.gitignore'.
- Returns an empty string if there's a trailing path separator.
- */
- short_stem :: proc(path: string) -> string {
- s := stem(path)
- if i := strings.index_byte(s, '.'); i != -1 {
- return s[:i]
- }
- return s
- }
- /*
- Gets the file extension from a path, including the dot.
- The file extension is such that stem(path) + ext(path) = base(path).
- Only the last dot is considered when splitting the file extension.
- See `long_ext`.
- e.g.
- 'name.tar.gz' -> '.gz'
- 'name.txt' -> '.txt'
- Returns an empty string if there is no dot.
- Returns an empty string if there is a trailing path separator.
- */
- ext :: proc(path: string) -> string {
- for i := len(path)-1; i >= 0 && !is_separator(path[i]); i -= 1 {
- if path[i] == '.' {
- return path[i:]
- }
- }
- return ""
- }
- /*
- Gets the file extension from a path, including the dot.
- The long file extension is such that short_stem(path) + long_ext(path) = base(path).
- The first dot is used to split off the file extension, unlike `ext` which uses the last dot.
- e.g.
- 'name.tar.gz' -> '.tar.gz'
- 'name.txt' -> '.txt'
- Returns an empty string if there is no dot.
- Returns an empty string if there is a trailing path separator.
- */
- long_ext :: proc(path: string) -> string {
- if len(path) > 0 && is_separator(path[len(path) - 1]) {
- // NOTE(tetra): Trailing separator
- return ""
- }
- // NOTE(tetra): Get the basename
- path := path
- if i := strings.last_index_any(path, SEPARATOR_CHARS); i != -1 {
- path = path[i+1:]
- }
- if i := strings.index_byte(path, '.'); i != -1 {
- return path[i:]
- }
- return ""
- }
- /*
- Returns the shortest path name equivalent to `path` through solely lexical processing.
- It applies the folliwng rules until none of them can be applied:
- * Replace multiple separators with a single one
- * Remove each current directory (`.`) path name element
- * Remove each inner parent directory (`..`) path and the preceding paths
- * Remove `..` that begin at the root of a path
- * All possible separators are replaced with the OS specific separator
- The return path ends in a slash only if it represents the root of a directory (`C:\` on Windows and `/` on *nix systems).
- If the result of the path is an empty string, the returned path with be `"."`.
- */
- clean :: proc(path: string, allocator := context.allocator) -> string {
- context.allocator = allocator
- path := path
- original_path := path
- vol_len := volume_name_len(path)
- path = path[vol_len:]
- if path == "" {
- if vol_len > 1 && original_path[1] != ':' {
- s, ok := from_slash(original_path)
- if !ok {
- s = strings.clone(s)
- }
- return s
- }
- return strings.concatenate({original_path, "."})
- }
- rooted := is_separator(path[0])
- n := len(path)
- out := &Lazy_Buffer{
- s = path,
- vol_and_path = original_path,
- vol_len = vol_len,
- }
- defer lazy_buffer_destroy(out)
- r, dot_dot := 0, 0
- if rooted {
- lazy_buffer_append(out, SEPARATOR)
- r, dot_dot = 1, 1
- }
- for r < n {
- switch {
- case is_separator(path[r]):
- r += 1
- case path[r] == '.' && (r+1 == n || is_separator(path[r+1])):
- r += 1
- case path[r] == '.' && path[r+1] == '.' && (r+2 == n || is_separator(path[r+2])):
- r += 2
- switch {
- case out.w > dot_dot:
- out.w -= 1
- for out.w > dot_dot && !is_separator(lazy_buffer_index(out, out.w)) {
- out.w -= 1
- }
- case !rooted:
- if out.w > 0 {
- lazy_buffer_append(out, SEPARATOR)
- }
- lazy_buffer_append(out, '.')
- lazy_buffer_append(out, '.')
- dot_dot = out.w
- }
- case:
- if rooted && out.w != 1 || !rooted && out.w != 0 {
- lazy_buffer_append(out, SEPARATOR)
- }
- for ; r < n && !is_separator(path[r]); r += 1 {
- lazy_buffer_append(out, path[r])
- }
- }
- }
- if out.w == 0 {
- lazy_buffer_append(out, '.')
- }
- s := lazy_buffer_string(out)
- cleaned, new_allocation := from_slash(s)
- if new_allocation {
- delete(s)
- }
- return cleaned
- }
- // Returns the result of replacing each forward slash `/` character in the path with the separate OS specific character.
- from_slash :: proc(path: string, allocator := context.allocator) -> (new_path: string, new_allocation: bool) {
- if SEPARATOR == '/' {
- return path, false
- }
- return strings.replace_all(path, "/", SEPARATOR_STRING, allocator)
- }
- // Returns the result of replacing each OS specific separator with a forward slash `/` character.
- to_slash :: proc(path: string, allocator := context.allocator) -> (new_path: string, new_allocation: bool) {
- if SEPARATOR == '/' {
- return path, false
- }
- return strings.replace_all(path, SEPARATOR_STRING, "/", allocator)
- }
- Relative_Error :: enum {
- None,
- Cannot_Relate,
- }
- /*
- Returns a relative path that is lexically equivalent to the `target_path` when joined with the `base_path` with an OS specific separator.
- e.g. `join(base_path, rel(base_path, target_path))` is equivalent to `target_path`
- On failure, the `Relative_Error` will be state it cannot compute the necessary relative path.
- */
- rel :: proc(base_path, target_path: string, allocator := context.allocator) -> (string, Relative_Error) {
- context.allocator = allocator
- base_clean, target_clean := clean(base_path), clean(target_path)
- delete_target := true
- defer {
- if delete_target {
- delete(target_clean)
- }
- delete(base_clean)
- }
- if strings.equal_fold(target_clean, base_clean) {
- return strings.clone("."), .None
- }
- base_vol, target_vol := volume_name(base_path), volume_name(target_path)
- base := base_clean[len(base_vol):]
- target := target_clean[len(target_vol):]
- if base == "." {
- base = ""
- }
- base_slashed := len(base) > 0 && base[0] == SEPARATOR
- target_slashed := len(target) > 0 && target[0] == SEPARATOR
- if base_slashed != target_slashed || !strings.equal_fold(base_vol, target_vol) {
- return "", .Cannot_Relate
- }
- bl, tl := len(base), len(target)
- b0, bi, t0, ti: int
- for {
- for bi < bl && base[bi] != SEPARATOR {
- bi += 1
- }
- for ti < tl && target[ti] != SEPARATOR {
- ti += 1
- }
- strings.equal_fold(target[t0:ti], base[b0:bi]) or_break
- if bi < bl {
- bi += 1
- }
- if ti < tl {
- ti += 1
- }
- b0, t0 = bi, ti
- }
- if base[b0:bi] == ".." {
- return "", .Cannot_Relate
- }
- if b0 != bl {
- seps := strings.count(base[b0:bl], SEPARATOR_STRING)
- size := 2 + seps*3
- if tl != t0 {
- size += 1 + tl - t0
- }
- buf := make([]byte, size)
- n := copy(buf, "..")
- for _ in 0..<seps {
- buf[n] = SEPARATOR
- copy(buf[n+1:], "..")
- n += 3
- }
- if t0 != tl {
- buf[n] = SEPARATOR
- copy(buf[n+1:], target[t0:])
- }
- return string(buf), .None
- }
- delete_target = false
- return target[t0:], .None
- }
- /*
- Returns all but the last element path, usually the path's directory. Once the final element has been removed,
- `dir` calls `clean` on the path and trailing separators are removed. If the path consists purely of separators,
- then `"."` is returned.
- */
- dir :: proc(path: string, allocator := context.allocator) -> string {
- context.allocator = allocator
- vol := volume_name(path)
- i := len(path) - 1
- for i >= len(vol) && !is_separator(path[i]) {
- i -= 1
- }
- dir := clean(path[len(vol) : i+1])
- defer delete(dir)
- if dir == "." && len(vol) > 2 {
- return strings.clone(vol)
- }
- return strings.concatenate({vol, dir})
- }
- // Splits the PATH-like `path` string, returning an array of its separated components (delete after use).
- // For Windows the separator is `;`, for Unix it's `:`.
- // An empty string returns nil. A non-empty string with no separators returns a 1-element array.
- // Any empty components will be included, e.g. `a::b` will return a 3-element array, as will `::`.
- // Separators within pairs of double-quotes will be ignored and stripped, e.g. `"a:b"c:d` will return []{`a:bc`, `d`}.
- split_list :: proc(path: string, allocator := context.allocator) -> []string {
- if path == "" {
- return nil
- }
- start: int
- quote: bool
- start, quote = 0, false
- count := 0
- for i := 0; i < len(path); i += 1 {
- c := path[i]
- switch {
- case c == '"':
- quote = !quote
- case c == LIST_SEPARATOR && !quote:
- count += 1
- }
- }
- start, quote = 0, false
- list := make([]string, count + 1, allocator)
- index := 0
- for i := 0; i < len(path); i += 1 {
- c := path[i]
- switch {
- case c == '"':
- quote = !quote
- case c == LIST_SEPARATOR && !quote:
- list[index] = path[start:i]
- index += 1
- start = i + 1
- }
- }
- assert(index == count)
- list[index] = path[start:]
- for s0, i in list {
- s, new := strings.replace_all(s0, `"`, ``, allocator)
- if !new {
- s = strings.clone(s, allocator)
- }
- list[i] = s
- }
- return list
- }
- /*
- Lazy_Buffer is a lazily made path buffer
- When it does allocate, it uses the context.allocator
- */
- @(private)
- Lazy_Buffer :: struct {
- s: string,
- b: []byte,
- w: int, // write index
- vol_and_path: string,
- vol_len: int,
- }
- @(private)
- lazy_buffer_index :: proc(lb: ^Lazy_Buffer, i: int) -> byte {
- if lb.b != nil {
- return lb.b[i]
- }
- return lb.s[i]
- }
- @(private)
- lazy_buffer_append :: proc(lb: ^Lazy_Buffer, c: byte) {
- if lb.b == nil {
- if lb.w < len(lb.s) && lb.s[lb.w] == c {
- lb.w += 1
- return
- }
- lb.b = make([]byte, len(lb.s))
- copy(lb.b, lb.s[:lb.w])
- }
- lb.b[lb.w] = c
- lb.w += 1
- }
- @(private)
- lazy_buffer_string :: proc(lb: ^Lazy_Buffer) -> string {
- if lb.b == nil {
- return strings.clone(lb.vol_and_path[:lb.vol_len+lb.w])
- }
- x := lb.vol_and_path[:lb.vol_len]
- y := string(lb.b[:lb.w])
- z := make([]byte, len(x)+len(y))
- copy(z, x)
- copy(z[len(x):], y)
- return string(z)
- }
- @(private)
- lazy_buffer_destroy :: proc(lb: ^Lazy_Buffer) {
- delete(lb.b)
- lb^ = {}
- }
|