15
15
// specific language governing permissions and limitations
16
16
// under the License.
17
17
18
+ //! [`DataSource`] and [`DataSourceExec`]
19
+
18
20
use std:: any:: Any ;
19
21
use std:: fmt;
20
22
use std:: fmt:: { Debug , Formatter } ;
@@ -34,9 +36,15 @@ use datafusion_physical_expr::{EquivalenceProperties, Partitioning};
34
36
use datafusion_physical_expr_common:: sort_expr:: LexOrdering ;
35
37
36
38
/// Common behaviors in Data Sources for both from Files and Memory.
37
- /// See `DataSourceExec` for physical plan implementation
38
39
///
40
+ /// # See Also
41
+ /// * [`DataSourceExec`] for physical plan implementation
42
+ /// * [`FileSource`] for file format implementations (Parquet, Json, etc)
43
+ ///
44
+ /// # Notes
39
45
/// Requires `Debug` to assist debugging
46
+ ///
47
+ /// [`FileSource`]: crate::file::FileSource
40
48
pub trait DataSource : Send + Sync + Debug {
41
49
fn open (
42
50
& self ,
@@ -71,10 +79,21 @@ pub trait DataSource: Send + Sync + Debug {
71
79
) -> datafusion_common:: Result < Option < Arc < dyn ExecutionPlan > > > ;
72
80
}
73
81
74
- /// Unified data source for file formats like JSON, CSV, AVRO, ARROW, PARQUET
82
+ /// [`ExecutionPlan`] handles different file formats like JSON, CSV, AVRO, ARROW, PARQUET
83
+ ///
84
+ /// `DataSourceExec` implements common functionality such as applying projections,
85
+ /// and caching plan properties.
86
+ ///
87
+ /// The [`DataSource`] trait describes where to find the data for this data
88
+ /// source (for example what files or what in memory partitions). Format
89
+ /// specifics are implemented with the [`FileSource`] trait.
90
+ ///
91
+ /// [`FileSource`]: crate::file::FileSource
75
92
#[ derive( Clone , Debug ) ]
76
93
pub struct DataSourceExec {
94
+ /// The source of the data -- for example, `FileScanConfig` or `MemorySourceConfig`
77
95
data_source : Arc < dyn DataSource > ,
96
+ /// Cached plan properties such as sort order
78
97
cache : PlanProperties ,
79
98
}
80
99
0 commit comments