JSON twin: https://www.healthaidb.com/software/mostly-ai.json
MOSTLY AI
https://mostly.ai/synthetic-data-platform
MOSTLY AI is a synthetic data platform and open-source SDK that generates high-fidelity, privacy-preserving structured and text data for AI/ML, analytics, testing and data sharing in regulated environments such as healthcare and life sciences.
Enterprise-ready data intelligence platform plus a permissive open-source Synthetic Data SDK (Apache 2.0) that trains generative models for tabular, time-series and text data. Provides local or cloud deployment, built-in privacy controls (differential privacy, privacy/fidelity reports), exportable generators, integrations with data platforms (e.g., Databricks, AWS marketplace), and compliance posture including SOC 2 and HIPAA support for healthcare use cases.
yes
2017
Options for on-prem/private-cloud/air-gapped deployments; regional cloud hosting options (EU and other regions supported)
P1085
2025-09-07
SDK: Apache-2.0 (open source); Platform: commercial/proprietary (enterprise license)
Contact vendor for enterprise pricing; offers free tier/SDK for evaluation and a start-for-free option for the platform—request demo or sign up on vendor site.
enterprise_quote
2017
SaaS-hosted or on-prem/private-cloud (air-gapped) deployments; Python runtime for SDK
product
1.0
{ "company_name": "MOSTLY AI", "company_url": "https://mostly.ai", "company_offices": [ "Austria", "United States" ], "company_founding": "2017", "product_url": "https://mostly.ai/synthetic-data-platform", "categories": [ "data anonymization", "synthetic data", "analytics", "AI/ML training", "testing & QA", "data sharing", "simulated data" ], "market_segment": [ "enterprise", "smb" ], "links": [ "https://mostly.ai", "https://mostly.ai/synthetic-data-platform", "https://mostly.ai/features", "https://mostly.ai/docs", "https://mostly.ai/privacy", "https://mostly.ai/pricing", "https://elion.health/products/mostly-ai", "https://www.g2.com/products/mostly-ai-synthetic-data-platform/reviews", "https://www.linkedin.com/company/mostlyai", "https://mostly.ai/imprint" ], "summary": "MOSTLY AI is a synthetic data platform and open-source SDK that generates high-fidelity, privacy-preserving structured and text data for AI/ML, analytics, testing and data sharing in regulated environments such as healthcare and life sciences.", "description": "Enterprise-ready data intelligence platform plus a permissive open-source Synthetic Data SDK (Apache 2.0) that trains generative models for tabular, time-series and text data. Provides local or cloud deployment, built-in privacy controls (differential privacy, privacy/fidelity reports), exportable generators, integrations with data platforms (e.g., Databricks, AWS marketplace), and compliance posture including SOC 2 and HIPAA support for healthcare use cases.", "target_users": [ "data scientists", "ML engineers", "healthcare analytics teams", "clinical researchers", "IT/data engineering", "product/QA teams", "compliance/privacy teams", "life sciences researchers" ], "specialties": [ "healthcare analytics", "clinical research", "pharma / life sciences", "payer analytics", "hospital & health system data", "software testing / QA" ], "regions_available": [ "United States", "European Union", "United Kingdom", "Canada", "Australia", "Global" ], "languages_supported": [ "English" ], "pricing_model": "enterprise_quote", "pricing_details": "Contact vendor for enterprise pricing; offers free tier/SDK for evaluation and a start-for-free option for the platform—request demo or sign up on vendor site.", "license": "SDK: Apache-2.0 (open source); Platform: commercial/proprietary (enterprise license)", "deployment_model": [ "SaaS", "on_prem", "private_cloud", "air_gapped" ], "os_platforms": [ "Web", "Linux", "macOS", "Windows" ], "features": [ "synthetic data generation (realistic, stat-preserving)", "privacy-by-design default anonymization", "Synthetic Data SDK", "model overfitting prevention", "rare category protection", "extreme value protection", "extreme sequence length protection", "random-draw synthesis", "mock data generation for testing/QA", "simulated data / data-driven simulations", "data sharing / data democratization tooling", "privacy configuration defaults", "privacy protection validation and metrics", "AI Assistant (data-native workspace)" ], "optional_modules": [ "AI Assistant", "Synthetic Data SDK (client-side SDKs)", "Simulated Data module", "Mock Data module" ], "integrations": [], "data_standards": [], "api_available": "yes", 
"system_requirements": "SaaS-hosted or on-prem/private-cloud (air-gapped) deployments; Python runtime for SDK", "compliance": [ "GDPR", "CCPA/CPRA", "HIPAA", "PDPA", "APPI", "SOC 2", "ISO 27001" ], "certifications": [ "SOC 2 Type II", "ISO 27001" ], "security_features": [ "encryption in transit and at rest", "role-based access control (RBAC)", "SSO / Keycloak-based authentication (SAML/OIDC)", "audit logs", "model memorization/overfitting protections", "2FA" ], "privacy_features": [ "default anonymization / privacy-by-design", "rare category substitution", "extreme value removal", "sequence length protection", "privacy-preserving model training and validation" ], "data_residency": "Options for on-prem/private-cloud/air-gapped deployments; regional cloud hosting options (EU and other regions supported)", "customers": [ "City of Vienna", "Telefonica", "Erste Group", "New York-Presbyterian (referenced case)", "Unnamed Fortune 100 bank (referenced case)" ], "user_reviews": [ "Helps maintain customer privacy and I can assure my customers that their sensitive data is safe.", "Interface is easy to use — I don't have to write code to produce high-quality synthesized data.", "High-fidelity synthetic data that preserves analytic value while protecting PII.", "Useful for testing and sharing data with third parties without privacy risk." ], "ratings": [ "G2: 4.5/5 (approx. 17 reviews)", "AWS Marketplace: positive user reviews (no consolidated score)" ], "support_channels": [ "email", "ticketing", "community" ], "training_options": [ "documentation", "webinars", "live_online" ], "release_year": "2017", "integration_partners": [ "AWS Marketplace", "GitHub (MOSTLY AI Synthetic Data SDK)" ], "id": "P1085", "slug": "mostly-ai", "type": "product", "version": "1.0", "last_updated": "2025-09-07", "links_json": { "self": "https://www.healthaidb.com/software/mostly-ai.json" } }