{"category":{"id":"data-engineering","label":"Data Engineering","kind":"topic"},"rising":[{"repo":"GokuMohandas/Made-With-ML","rank":474,"stars":48093,"velocityPerDay":71.8,"language":"Jupyter Notebook","description":"Learn how to develop, deploy and iterate on production-grade ML applications.","forks":7563,"url":"https://warpchart.dev/r/GokuMohandas/Made-With-ML"},{"repo":"DataTalksClub/data-engineering-zoomcamp","rank":596,"stars":42436,"velocityPerDay":32.6,"language":"Jupyter Notebook","description":"Data Engineering Zoomcamp is a free 9-week course on building production-ready data pipelines. The next cohort starts in January 2026. Join the course here 👇🏼","forks":8402,"url":"https://warpchart.dev/r/DataTalksClub/data-engineering-zoomcamp"},{"repo":"binhnguyennus/awesome-scalability","rank":229,"stars":71734,"velocityPerDay":20.7,"language":null,"description":"The Patterns of Scalable, Reliable, and Performant Large-Scale Systems","forks":7015,"url":"https://warpchart.dev/r/binhnguyennus/awesome-scalability"},{"repo":"umami-software/umami","rank":746,"stars":37166,"velocityPerDay":16.3,"language":"TypeScript","description":"Umami is a modern, privacy-focused analytics platform. An open-source alternative to Google Analytics, Mixpanel and Amplitude.","forks":7298,"url":"https://warpchart.dev/r/umami-software/umami"},{"repo":"PostHog/posthog","rank":836,"stars":35032,"velocityPerDay":15.2,"language":"Python","description":"🦔 PostHog is an all-in-one developer platform for building successful products. We offer product analytics, web analytics, session replay, error tracking, feat","forks":2858,"url":"https://warpchart.dev/r/PostHog/posthog"},{"repo":"grafana/grafana","rank":204,"stars":74422,"velocityPerDay":13.1,"language":"TypeScript","description":"The open and composable observability and data visualization platform. Visualize metrics, logs, and traces from multiple sources like Prometheus, Loki, Elastics","forks":14068,"url":"https://warpchart.dev/r/grafana/grafana"},{"repo":"apache/superset","rank":214,"stars":73291,"velocityPerDay":13.1,"language":"TypeScript","description":"Apache Superset is a Data Visualization and Data Exploration Platform","forks":17611,"url":"https://warpchart.dev/r/apache/superset"},{"repo":"metabase/metabase","rank":484,"stars":47680,"velocityPerDay":13.1,"language":"Clojure","description":"The easy-to-use open source Business Intelligence and Embedded Analytics tool that lets everyone work with data :bar_chart:","forks":6543,"url":"https://warpchart.dev/r/metabase/metabase"},{"repo":"duckdb/duckdb","rank":688,"stars":38779,"velocityPerDay":13.1,"language":"C++","description":"DuckDB is an analytical in-process SQL database management system","forks":3319,"url":"https://warpchart.dev/r/duckdb/duckdb"},{"repo":"langfuse/langfuse","rank":1160,"stars":29072,"velocityPerDay":12,"language":"TypeScript","description":"🪢 Open source AI engineering platform: LLM evals, observability, metrics, prompt management, playground, datasets. Integrates with OpenTelemetry, LangChain, Op","forks":3011,"url":"https://warpchart.dev/r/langfuse/langfuse"},{"repo":"ClickHouse/ClickHouse","rank":475,"stars":47996,"velocityPerDay":10.9,"language":"C++","description":"ClickHouse® is a real-time analytics database management system","forks":8512,"url":"https://warpchart.dev/r/ClickHouse/ClickHouse"},{"repo":"plausible/analytics","rank":1321,"stars":27132,"velocityPerDay":6.9,"language":"Elixir","description":"Open source, privacy-first web analytics. Lightweight, cookie-free Google Analytics alternative. Self-hosted or cloud.","forks":1629,"url":"https://warpchart.dev/r/plausible/analytics"},{"repo":"openobserve/openobserve","rank":2232,"stars":19277,"velocityPerDay":6.9,"language":"TypeScript","description":"Open source observability platform for logs, metrics, traces, frontend monitoring, pipelines and LLM observability. A sophisticated, simple and highly performan","forks":857,"url":"https://warpchart.dev/r/openobserve/openobserve"},{"repo":"apache/airflow","rank":517,"stars":45809,"velocityPerDay":6.5,"language":"Python","description":"Apache Airflow - A platform to programmatically author, schedule, and monitor workflows","forks":17238,"url":"https://warpchart.dev/r/apache/airflow"},{"repo":"apache/spark","rank":573,"stars":43453,"velocityPerDay":6.5,"language":"Scala","description":"Apache Spark - A unified analytics engine for large-scale data processing","forks":29223,"url":"https://warpchart.dev/r/apache/spark"},{"repo":"eugeneyan/applied-ml","rank":1110,"stars":29769,"velocityPerDay":5.2,"language":null,"description":"📚 Papers & tech blogs by companies sharing their work on data science & machine learning in production.","forks":3948,"url":"https://warpchart.dev/r/eugeneyan/applied-ml"},{"repo":"apache/flink","rank":1416,"stars":26080,"velocityPerDay":5.2,"language":"Java","description":"Apache Flink","forks":13956,"url":"https://warpchart.dev/r/apache/flink"},{"repo":"mindsdb/minds","rank":674,"stars":39301,"velocityPerDay":4.4,"language":"Dockerfile","description":"General-purpose AI designed for knowledge workers — creators, strategists, and operators — and individuals seeking AI systems they can truly control to help the","forks":6211,"url":"https://warpchart.dev/r/mindsdb/minds"},{"repo":"timescale/timescaledb","rank":1755,"stars":22895,"velocityPerDay":3.4,"language":"C","description":"A time-series database for high-performance real-time analytics packaged as a Postgres extension","forks":1109,"url":"https://warpchart.dev/r/timescale/timescaledb"},{"repo":"vectordotdev/vector","rank":1853,"stars":22036,"velocityPerDay":3.4,"language":"Rust","description":"A high-performance observability data pipeline.","forks":2172,"url":"https://warpchart.dev/r/vectordotdev/vector"},{"repo":"airbytehq/airbyte","rank":1947,"stars":21455,"velocityPerDay":3.4,"language":"Python","description":"Open-source data movement for ELT pipelines and AI agents — from APIs, databases & files to warehouses, lakes, and AI applications. Both self-hosted and Cloud.","forks":5218,"url":"https://warpchart.dev/r/airbytehq/airbyte"},{"repo":"apache/kafka","rank":948,"stars":32816,"velocityPerDay":2.2,"language":"Java","description":"Apache Kafka - A distributed event streaming platform","forks":15272,"url":"https://warpchart.dev/r/apache/kafka"},{"repo":"webtorrent/webtorrent","rank":1040,"stars":31026,"velocityPerDay":1.7,"language":"JavaScript","description":"⚡️ Streaming torrent client for the web","forks":2790,"url":"https://warpchart.dev/r/webtorrent/webtorrent"},{"repo":"donnemartin/data-science-ipython-notebooks","rank":1154,"stars":29166,"velocityPerDay":1.7,"language":"Python","description":"Data science Python notebooks: Deep learning (TensorFlow, Theano, Caffe, Keras), scikit-learn, Kaggle, big data (Spark, Hadoop MapReduce, HDFS), matplotlib, pan","forks":8030,"url":"https://warpchart.dev/r/donnemartin/data-science-ipython-notebooks"},{"repo":"getredash/redash","rank":1192,"stars":28640,"velocityPerDay":1.7,"language":"Python","description":"Make Your Company Data Driven. Connect to any data source, easily visualize, dashboard and share your data.","forks":4603,"url":"https://warpchart.dev/r/getredash/redash"},{"repo":"kestra-io/kestra","rank":1330,"stars":27056,"velocityPerDay":1.7,"language":"Java","description":"Event Driven Orchestration & Scheduling Platform for Mission Critical Applications","forks":2621,"url":"https://warpchart.dev/r/kestra-io/kestra"},{"repo":"PrefectHQ/prefect","rank":1785,"stars":22608,"velocityPerDay":1.7,"language":"Python","description":"Prefect is a workflow orchestration framework for building resilient data pipelines in Python.","forks":2337,"url":"https://warpchart.dev/r/PrefectHQ/prefect"},{"repo":"matomo-org/matomo","rank":1922,"stars":21596,"velocityPerDay":1.7,"language":"PHP","description":"Empowering People Ethically 🚀 — Matomo is hiring! Join us → https://matomo.org/jobs Matomo is the leading open-source alternative to Google Analytics, giving y","forks":2857,"url":"https://warpchart.dev/r/matomo-org/matomo"},{"repo":"qax-os/excelize","rank":2042,"stars":20666,"velocityPerDay":1.7,"language":"Go","description":"Go language library for reading and writing Microsoft Excel™ (XLAM / XLSM / XLSX / XLTM / XLTX) spreadsheets","forks":1910,"url":"https://warpchart.dev/r/qax-os/excelize"},{"repo":"amark/gun","rank":2266,"stars":19058,"velocityPerDay":1.7,"language":"JavaScript","description":"An open source cybersecurity protocol for syncing decentralized graph data.","forks":1239,"url":"https://warpchart.dev/r/amark/gun"}],"catalog":{"size":3000,"asOf":"2026-06-15T01:35:15.729Z"}}