JSON twin: https://www.healthaidb.com/software/snowplow.json
Snowplow
https://snowplow.io/customer-data-infrastructure
Snowplow is a customer data infrastructure (behavioral data platform) that captures, enriches and delivers event-level behavioral data to your cloud data platform in real time for analytics, personalization and AI use cases.
Snowplow provides event tracking, real-time data pipelines, enrichment, data modeling and activation (reverse ETL, event forwarding, Signals) enabling teams to build governed, high-fidelity customer data inside their own cloud stack (warehouses, lakes, streams). It is offered as open-source software and as managed/cloud (BDP) deployments with enterprise security and compliance options (including HIPAA, GDPR, ISO 27001).
yes
2012
Private Managed Cloud: customer-owned cloud account/VPC on AWS, GCP, or Azure (data stays in your infra); or Snowplow BDP Cloud (region options vary).
P1526
2025-09-07
Open-source core (Apache-2.0) + commercial/proprietary for managed/cloud offerings
Pricing varies by monthly event volume, deployment (self-hosted vs managed BDP), hosting preferences and selected features; contact vendor for quote.
enterprise_quote
2012
—
For Private Managed Cloud: customer cloud account/VPC on AWS, GCP, or Azure; destination warehouse/lake/stream (Snowflake, BigQuery, Databricks, S3, Kafka, etc.).
product
1.0
{ "company_name": "Snowplow", "company_url": "https://snowplow.io", "company_offices": [ "United Kingdom", "United States" ], "company_founding": "2012", "product_url": "https://snowplow.io/customer-data-infrastructure", "categories": [ "analytics", "customer data infrastructure", "event tracking", "data pipeline", "data engineering" ], "market_segment": [ "enterprise", "smb" ], "links": [ "https://snowplow.io", "https://snowplow.io/about-us", "https://snowplow.io/customer-data-infrastructure", "https://docs.snowplow.io/docs", "https://snowplow.io/integrations-catalog", "https://snowplow.io/security", "https://snowplow.io/pricing", "https://snowplow.io/contact-us", "https://www.g2.com/products/snowplow/reviews", "https://github.com/snowplow/snowplow" ], "summary": "Snowplow is a customer data infrastructure (behavioral data platform) that captures, enriches and delivers event-level behavioral data to your cloud data platform in real time for analytics, personalization and AI use cases.", "description": "Snowplow provides event tracking, real-time data pipelines, enrichment, data modeling and activation (reverse ETL, event forwarding, Signals) enabling teams to build governed, high-fidelity customer data inside their own cloud stack (warehouses, lakes, streams). It is offered as open-source software and as managed/cloud (BDP) deployments with enterprise security and compliance options (including HIPAA, GDPR, ISO 27001).", "target_users": [ "data engineers", "data scientists", "product managers", "analytics teams", "marketing teams", "software engineers", "IT/admins" ], "specialties": [], "regions_available": [ "United States", "United Kingdom", "European Union", "Canada", "Australia", "Global" ], "languages_supported": [ "English" ], "pricing_model": "enterprise_quote", "pricing_details": "Pricing varies by monthly event volume, deployment (self-hosted vs managed BDP), hosting preferences and selected features; contact vendor for quote.", "license": "Open-source core (Apache-2.0) + commercial/proprietary for managed/cloud offerings", "deployment_model": [ "private_managed_cloud", "managed_cloud (BDP Cloud)", "self-hosted / community edition" ], "os_platforms": [ "Web", "Android", "iOS", "Node.js", "Linux (server)" ], "features": [ "Event tracking (35+ trackers)", "Data pipeline: collection, validation, enrichment, transformation", "Real-time event forwarding (Pub/Sub, Kinesis, Kafka, SQS, HTTP)", "Warehouse-first delivery to Snowflake/BigQuery/Databricks/S3/Delta Lake", "Data Product Studio (cataloging, schema management)", "Data quality monitoring and alerts", "Unified event schema / single structured events table", "Profiles store / real-time user context", "Interventions (real-time engagement engine)", "Reverse ETL / warehouse-native syncs", "Pre-built data model packs and dbt models", "Integrations catalog and extensible enrichments", "Composable architecture (decoupled collection/enrichment/delivery)", "Type-safe code generation and pre-production testing", "Anonymization & PII pseudonymization" ], "optional_modules": [ "Profiles Store", "Interventions", "Data Model Packs", "Data Product Studio", "Event Forwarding", "Accelerators (pre-built recipes)" ], "integrations": [ "Snowflake", "Google BigQuery", "Databricks", "Amazon S3", "Delta Lake", "Apache Kafka", "Google Pub/Sub", "AWS Kinesis", "AWS SQS", "HTTP endpoints", "Census (reverse ETL)" ], "data_standards": [], "api_available": "yes", "system_requirements": "For Private Managed Cloud: customer cloud account/VPC on AWS, GCP, or Azure; destination warehouse/lake/stream (Snowflake, BigQuery, Databricks, S3, Kafka, etc.).", "compliance": [ "ISO 27001", "GDPR", "CCPA", "HIPAA-eligible (BAA available)" ], "certifications": [ "ISO 27001" ], "security_features": [ "SAML SSO (major IdPs including Microsoft Entra ID, Okta)", "Access controls / RBAC for console features", "Vulnerability and anomaly detection", "Regular penetration testing", "In-stream IP anonymization / PII pseudonymization", "Encryption (in transit and at-rest implied)" ], "privacy_features": [ "Business Associate Addendum (BAA) available", "IP anonymization", "PII pseudonymization", "Basis-for-tracking / consent context per event", "Anonymous / cookieless tracking option" ], "data_residency": "Private Managed Cloud: customer-owned cloud account/VPC on AWS, GCP, or Azure (data stays in your infra); or Snowplow BDP Cloud (region options vary).", "customers": [ "HelloFresh", "Transavia", "Engel & Völkers", "Supercell", "Strava", "Burberry", "Secret Escapes", "CarTrawler", "Kindred Group", "HeyJobs", "Trinny London", "Digital Virgo", "Animoto", "Auto Trader", "Bizzabo", "DPG Media", "Gousto", "JustWatch", "La Presse", "Omio", "Pebmed", "Picnic", "Software.com", "Tripaneer", "Tourlane", "Welcome to the Jungle" ], "user_reviews": [ "Lets us store very granular data about customer interactions with our site.", "Their support and pipeline management is awesome — I'd recommend having them manage that for you.", "Snowplow was a game changer in our understanding of our customer behaviour.", "Open source so you get full access to the data and can customize as needed.", "Powerful and flexible but can be complex to set up and requires engineering resources.", "Real-time delivery into our warehouse made advanced analytics and personalization possible.", "Excellent for building a governed, first-party behavioral data layer.", "High-quality event data and great observability of the pipeline.", "Good for companies that want full control of their data rather than a black-box CDP.", "Support team knowledgeable; managed pipeline option removes operational burden." ], "ratings": [ "Capterra: 5.0/5 (aggregate listed score)", "TrustRadius: 10/10 (Snowplow Insights listings)", "Software Advice: Functionality 4.4 / Ease of Use 4.1 / Customer Support 4.9 (reported)", "AWS Marketplace: Positive customer reviews (various) referenced from marketplace listings" ], "support_channels": [ "email", "ticketing", "community", "documentation", "GitHub" ], "training_options": [ "documentation", "webinars", "live_online (demos)", "10-minute product demos/events" ], "release_year": "2012", "integration_partners": [ "AWS", "Databricks", "Snowflake", "Google BigQuery / Google Cloud Platform", "Microsoft Azure", "Confluent / Kafka", "Amazon S3", "Delta Lake", "Census", "Databricks Delta", "BigQuery", "Kafka" ], "id": "P1526", "slug": "snowplow", "type": "product", "version": "1.0", "last_updated": "2025-09-07", "links_json": { "self": "https://www.healthaidb.com/software/snowplow.json" } }