mod field_type;
mod statistics;
use datamodel_renderer as render;
use futures::TryStreamExt;
use mongodb::{
bson::{doc, Document},
options::AggregateOptions,
Database,
};
use mongodb_schema_describer::MongoSchema;
use schema_connector::{warnings::Model, IntrospectionContext, IntrospectionResult, Warnings};
use statistics::*;
pub(super) async fn sample(
database: Database,
schema: MongoSchema,
ctx: &IntrospectionContext,
) -> Result<IntrospectionResult, mongodb::error::Error> {
let mut statistics = Statistics::new(ctx.composite_type_depth);
let mut warnings = Warnings::new();
for collection in schema.walk_collections() {
statistics.track_model(collection.name(), collection);
if collection.has_schema() {
warnings.json_schema_defined.push(Model {
model: collection.name().to_owned(),
})
}
if collection.is_capped() {
warnings.capped_collection.push(Model {
model: collection.name().to_owned(),
})
}
}
for collection in schema.walk_collections() {
let options = AggregateOptions::builder().allow_disk_use(Some(true)).build();
let mut documents = database
.collection::<Document>(collection.name())
.aggregate(vec![doc! { "$sample": { "size": SAMPLE_SIZE } }], Some(options))
.await?;
while let Some(document) = documents.try_next().await? {
statistics.track_model_fields(collection.name(), document);
}
for index in collection.indexes() {
statistics.track_index(collection.name(), index);
}
}
let mut data_model = render::Datamodel::default();
statistics.render(ctx.datasource(), &mut data_model, &mut warnings);
let psl_string = if ctx.render_config {
let config = render::Configuration::from_psl(ctx.configuration(), None);
format!("{config}\n{data_model}")
} else {
data_model.to_string()
};
let warnings = if !warnings.is_empty() {
Some(warnings.to_string())
} else {
None
};
Ok(IntrospectionResult {
data_model: psl::reformat(&psl_string, 2).unwrap(),
is_empty: data_model.is_empty(),
warnings,
views: None,
})
}