// Licensed to the Apache Software Foundation (ASF) under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, // software distributed under the License is distributed on an // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY // KIND, either express or implied. See the License for the // specific language governing permissions and limitations // under the License. // This API is EXPERIMENTAL. #pragma once #include #include #include "arrow/compute/type_fwd.h" // IWYU pragma: export #include "arrow/dataset/visibility.h" #include "arrow/filesystem/type_fwd.h" // IWYU pragma: export #include "arrow/type_fwd.h" // IWYU pragma: export namespace arrow { namespace dataset { class Dataset; class DatasetFactory; using DatasetVector = std::vector>; class UnionDataset; class UnionDatasetFactory; class Fragment; using FragmentIterator = Iterator>; using FragmentVector = std::vector>; class FragmentScanOptions; class FileSource; class FileFormat; class FileFragment; class FileWriter; class FileWriteOptions; class FileSystemDataset; class FileSystemDatasetFactory; struct FileSystemDatasetWriteOptions; class WriteNodeOptions; /// \brief Controls what happens if files exist in an output directory during a dataset /// write enum class ExistingDataBehavior : int8_t { /// Deletes all files in a directory the first time that directory is encountered kDeleteMatchingPartitions, /// Ignores existing files, overwriting any that happen to have the same name as an /// output file kOverwriteOrIgnore, /// Returns an error if there are any files or subdirectories in the output directory kError, }; class InMemoryDataset; class CsvFileFormat; class CsvFileWriter; class CsvFileWriteOptions; struct CsvFragmentScanOptions; class JsonFileFormat; class JsonFileWriter; class JsonFileWriteOptions; struct JsonFragmentScanOptions; class IpcFileFormat; class IpcFileWriter; class IpcFileWriteOptions; class IpcFragmentScanOptions; class ParquetFileFormat; class ParquetFileFragment; class ParquetFragmentScanOptions; class ParquetFileWriter; class ParquetFileWriteOptions; class Partitioning; class PartitioningFactory; class PartitioningOrFactory; struct KeyValuePartitioningOptions; class DirectoryPartitioning; class HivePartitioning; struct HivePartitioningOptions; class FilenamePartitioning; struct FilenamePartitioningOptions; class ScanNodeOptions; struct ScanOptions; class Scanner; class ScannerBuilder; class ScanTask; using ScanTaskVector = std::vector>; using ScanTaskIterator = Iterator>; } // namespace dataset } // namespace arrow