JSON twin: https://www.healthaidb.com/software/ydata.json
YData
https://ydata.ai/products/platform.html
YData Fabric is a data‑centric AI platform that provides data profiling, quality tooling and synthetic data generation to enable safe sharing, augmentation and bias mitigation for healthcare and pharma use cases.
Commercial platform (YData Fabric and SDK) for generating statistically accurate synthetic tabular and time‑series healthcare data, profiling and data cataloging, pipelines and model‑ready dataset creation; supports on‑prem/cloud deployment to keep PHI inside customer infrastructure and is marketed to healthcare and life‑sciences organisations for data sharing, augmentation, de‑biasing and ML model development.
yes
2019
Customer-selectable regions (US and EU backups mentioned); supports deploying in customer's AWS/Azure/GCP region (BYO cloud region)
P1837
2025-09-07
Commercial proprietary
Contact vendor for pricing; offers demo and trial/dashboard access; deployment on customer cloud or on‑prem (contact sales).
enterprise_quote
Kubernetes-based deployment; supports AWS, Azure, Google Cloud; cert-manager, instance types / GPU selection; uses cloud-managed storage and databases
product
1.0
{ "company_name": "YData", "company_url": "https://ydata.ai", "company_offices": [ "United States", "Portugal" ], "company_founding": "2019", "product_url": "https://ydata.ai/products/platform.html", "categories": [ "data-centric AI", "synthetic data", "data profiling", "data catalog", "data pipelines", "data quality" ], "market_segment": [ "enterprise", "SMB" ], "links": [ "https://ydata.ai/", "https://ydata.ai/products/platform.html", "https://ydata.ai/products/synthesizer.html", "https://docs.fabric.ydata.ai/", "https://trust.ydata.ai", "https://ydata.ai/company.html", "https://ydata.ai/contact-us.html", "https://elion.health/products/ydata", "https://www.g2.com/products/ydata/reviews", "https://aws.amazon.com/marketplace/pp/prodview-hgrqd5lqnqblm" ], "summary": "YData Fabric is a data‑centric AI platform that provides data profiling, quality tooling and synthetic data generation to enable safe sharing, augmentation and bias mitigation for healthcare and pharma use cases.", "description": "Commercial platform (YData Fabric and SDK) for generating statistically accurate synthetic tabular and time‑series healthcare data, profiling and data cataloging, pipelines and model‑ready dataset creation; supports on‑prem/cloud deployment to keep PHI inside customer infrastructure and is marketed to healthcare and life‑sciences organisations for data sharing, augmentation, de‑biasing and ML model development.", "target_users": [ "data scientists", "ML engineers", "clinical researchers", "biostatisticians", "data engineers", "IT/admins", "privacy/compliance officers", "product managers" ], "specialties": [ "Healthcare", "Pharma", "Clinical research", "Real‑world evidence (RWE)", "Medical imaging (supporting derived/tabular workflows)", "Genomics/omics", "Biotech" ], "regions_available": [ "Global" ], "languages_supported": [ "English" ], "pricing_model": "enterprise_quote", "pricing_details": "Contact vendor for pricing; offers demo and trial/dashboard access; deployment on 
customer cloud or on‑prem (contact sales).", "license": "Commercial proprietary", "deployment_model": [ "SaaS", "self-hosted (customer cloud)", "cloud-managed on AWS/Azure/GCP", "hybrid" ], "os_platforms": [ "Web UI", "Jupyter Lab (cloud/workspace)", "VS Code (web/remote)" ], "features": [ "Data catalog with automated profiling and PII detection", "Automated data profiling and quality reports", "Synthetic data generation (tabular, time-series, multi-table, text)", "Privacy controls and configurable privacy level for synthetic data", "Anonymization and conditional sampling", "Labs - on-demand development environments with configurable hardware (including GPUs)", "Pipelines - job orchestration, versioning and experiment tracking", "SDK and APIs for programmatic access (Python)", "Connectors for databases, cloud storage and data warehouses", "Integration recipes for Databricks, Snowflake, DVC, etc.", "Provisionable compute (instance type selection) and GPU support", "Secure deployment tooling (Kubernetes manifests, cert-manager, SBOM)", "Monitoring, backups and disaster recovery", "Role-based access controls and login provider integrations" ], "optional_modules": [ "Synthetic Data module", "Pipelines orchestration module", "Labs (managed dev environments)", "Data Catalog / Connectors pack", "Fabric SDK" ], "integrations": [ "Snowflake", "Databricks", "DVC", "H2O", "Algorithmia", "UbiOps", "Great Expectations", "Azure ML", "AWS SageMaker", "Google Vertex AI", "Relational databases (RDBMS connectors)", "Cloud object storage (AWS S3, GCS, Azure Blob Storage)" ], "data_standards": [], "api_available": "yes", "system_requirements": "Kubernetes-based deployment; supports AWS, Azure, Google Cloud; cert-manager, instance types / GPU selection; uses cloud-managed storage and databases", "compliance": [ "GDPR" ], "certifications": [], "security_features": [ "TLS/SSL for data in transit", "AES-256 encryption at rest", "JWT-based API authentication", "SSO/OpenID/SAML and AD 
integrations", "MFA/Two-step verification", "RBAC (role-based access control)", "Audit logging and monitoring", "SBOM (Software Bill of Materials) availability" ], "privacy_features": [ "Synthetic data generation to avoid use of real PHI", "Configurable privacy levels for synthetic data", "Anonymization tools", "Option to keep customer data in customer cloud (data never leaves customer cloud)", "SBOM and privacy-focused deployment practices" ], "data_residency": "Customer-selectable regions (US and EU backups mentioned); supports deploying in customer's AWS/Azure/GCP region (BYO cloud region)", "customers": [ "EDP", "Igloo" ], "user_reviews": [], "ratings": [], "support_channels": [ "contact form", "documentation" ], "training_options": [ "documentation" ], "release_year": "", "integration_partners": [ "Amazon Web Services", "Google Cloud Platform", "Microsoft Azure" ], "id": "P1837", "slug": "ydata", "type": "product", "version": "1.0", "last_updated": "2025-09-07", "links_json": { "self": "https://www.healthaidb.com/software/ydata.json" } }