risingwave_connector/source/filesystem/opendal_source/posix_fs_source.rs
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58
// Copyright 2024 RisingWave Labs
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
use std::marker::PhantomData;
use anyhow::Context;
use opendal::layers::{LoggingLayer, RetryLayer};
use opendal::services::Fs;
use opendal::Operator;
use super::opendal_enumerator::OpendalEnumerator;
use super::{OpendalSource, PosixFsProperties};
use crate::error::ConnectorResult;
// Posix fs source should only be used for testing.
// For a single-CN cluster, the behavior is well-defined. It will read from the local file system.
// For a multi-CN cluster, each CN will read from its own local file system under the given directory.
impl<Src: OpendalSource> OpendalEnumerator<Src> {
    /// Builds an enumerator that lists files through an opendal `Fs` operator.
    ///
    /// The operator is rooted at `posix_fs_properties.root` and wrapped with the default
    /// logging and retry layers. When `match_pattern` is set, it is compiled into a glob
    /// matcher and the prefix becomes an empty string; otherwise both the prefix and the
    /// matcher are `None`.
    ///
    /// # Errors
    ///
    /// Fails if the operator cannot be constructed, or if `match_pattern` is not a valid
    /// glob pattern (reported as `Invalid match_pattern: <pattern>`).
    pub fn new_posix_fs_source(posix_fs_properties: PosixFsProperties) -> ConnectorResult<Self> {
        // Assemble the operator on top of the Fs service builder.
        let fs_builder = Fs::default().root(&posix_fs_properties.root);
        let op: Operator = Operator::new(fs_builder)?
            .layer(LoggingLayer::default())
            .layer(RetryLayer::default())
            .finish();

        // Compile the optional glob; an invalid pattern aborts construction.
        let matcher = posix_fs_properties
            .match_pattern
            .as_ref()
            .map(|pattern| {
                glob::Pattern::new(pattern)
                    .with_context(|| format!("Invalid match_pattern: {}", pattern))
            })
            .transpose()?;

        // TODO(Kexiang): Currently, the Fs lister in opendal does not support a prefix
        // (seems to be a bug in opendal), so the prefix is an empty string whenever a
        // matcher is present.
        let prefix = matcher.as_ref().map(|_| String::new());

        Ok(Self {
            op,
            prefix,
            matcher,
            marker: PhantomData,
            compression_format: posix_fs_properties.compression_format,
        })
    }
}