python:15,sql:10,data pipelines:10,etl:5,hadoop:5,apache spark:5,big data:5,cloud computing:3,data warehousing:2,git:2,docker:2,