Learn more  » Push, build, and install  RubyGems npm packages Python packages Maven artifacts PHP packages Go Modules Bower components Debian packages RPM packages NuGet packages

arrow-nightlies / pyarrow   python

Repository URL to install this package:

Version: 19.0.0.dev70 

/ include / arrow / filesystem / path_util.h

// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements.  See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership.  The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License.  You may obtain a copy of the License at
//
//   http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied.  See the License for the
// specific language governing permissions and limitations
// under the License.

#pragma once

#include <optional>
#include <string>
#include <string_view>
#include <utility>
#include <vector>

#include "arrow/type_fwd.h"

namespace arrow {
namespace fs {
namespace internal {

constexpr char kSep = '/';

// Computations on abstract paths (not local paths with system-dependent behaviour).
// Abstract paths are typically used in URIs.

// Split an abstract path into its individual components.
ARROW_EXPORT
std::vector<std::string> SplitAbstractPath(const std::string& path, char sep = kSep);

// Slice the individual components of an abstract path and combine them
//
// If offset or length are negative then an empty string is returned
// If offset is >= the number of components then an empty string is returned
// If offset + length is >= the number of components then length is truncated
ARROW_EXPORT
std::string SliceAbstractPath(const std::string& path, int offset, int length,
                              char sep = kSep);

// Return the extension of the file
ARROW_EXPORT std::string GetAbstractPathExtension(const std::string& s);

// Return the depth (number of components) of an abstract path
//
// Trailing slashes do not count towards depth
// Leading slashes do not count towards depth
//
// The root path ("/") has depth 0
ARROW_EXPORT int GetAbstractPathDepth(std::string_view path);

// Return the parent directory and basename of an abstract path.  Both values may be
// empty.
ARROW_EXPORT
std::pair<std::string, std::string> GetAbstractPathParent(const std::string& s);

// Validate an abstract path.
ARROW_EXPORT
Status ValidateAbstractPath(std::string_view path);

// Validate the components of an abstract path.
ARROW_EXPORT
Status ValidateAbstractPathParts(const std::vector<std::string>& parts);

// Append a non-empty stem to an abstract path.
ARROW_EXPORT
std::string ConcatAbstractPath(std::string_view base, std::string_view stem);

// Make path relative to base, if it starts with base.  Otherwise error out.
ARROW_EXPORT
Result<std::string> MakeAbstractPathRelative(const std::string& base,
                                             const std::string& path);

ARROW_EXPORT
std::string EnsureLeadingSlash(std::string_view s);

ARROW_EXPORT
std::string_view RemoveLeadingSlash(std::string_view s);

ARROW_EXPORT
std::string EnsureTrailingSlash(std::string_view s);

/// \brief remove the forward slash (if any) from the given path
/// \param s the input path
/// \param preserve_root if true, allow a path of just "/" to remain unchanged
ARROW_EXPORT
std::string_view RemoveTrailingSlash(std::string_view s, bool preserve_root = false);

ARROW_EXPORT
Status AssertNoTrailingSlash(std::string_view s);

inline bool HasTrailingSlash(std::string_view s) {
  return !s.empty() && s.back() == kSep;
}

inline bool HasLeadingSlash(std::string_view s) {
  return !s.empty() && s.front() == kSep;
}

ARROW_EXPORT
bool IsAncestorOf(std::string_view ancestor, std::string_view descendant);

ARROW_EXPORT
std::optional<std::string_view> RemoveAncestor(std::string_view ancestor,
                                               std::string_view descendant);

/// Return a vector of ancestors between a base path and a descendant.
/// For example,
///
/// AncestorsFromBasePath("a/b", "a/b/c/d/e") -> ["a/b/c", "a/b/c/d"]
ARROW_EXPORT
std::vector<std::string> AncestorsFromBasePath(std::string_view base_path,
                                               std::string_view descendant);

/// Given a vector of paths of directories which must be created, produce a the minimal
/// subset for passing to CreateDir(recursive=true) by removing redundant parent
/// directories
ARROW_EXPORT
std::vector<std::string> MinimalCreateDirSet(std::vector<std::string> dirs);

// Join the components of an abstract path.
template <class StringIt>
std::string JoinAbstractPath(StringIt it, StringIt end, char sep = kSep) {
  std::string path;
  for (; it != end; ++it) {
    if (it->empty()) continue;

    if (!path.empty()) {
      path += sep;
    }
    path += *it;
  }
  return path;
}

template <class StringRange>
std::string JoinAbstractPath(const StringRange& range, char sep = kSep) {
  return JoinAbstractPath(range.begin(), range.end(), sep);
}

/// Convert slashes to backslashes, on all platforms.  Mostly useful for testing.
ARROW_EXPORT
std::string ToBackslashes(std::string_view s);

/// Ensure a local path is abstract, by converting backslashes to regular slashes
/// on Windows.  Return the path unchanged on other systems.
ARROW_EXPORT
std::string ToSlashes(std::string_view s);

ARROW_EXPORT
bool IsEmptyPath(std::string_view s);

ARROW_EXPORT
bool IsLikelyUri(std::string_view s);

class ARROW_EXPORT Globber {
 public:
  ~Globber();
  explicit Globber(std::string pattern);
  bool Matches(const std::string& path);

 protected:
  struct Impl;
  std::unique_ptr<Impl> impl_;
};

}  // namespace internal
}  // namespace fs
}  // namespace arrow