{
  "$schema": "https://raw.githubusercontent.com/jsonresume/resume-schema/v1.0.0/schema.json",
  "basics": {
    "name": "Nazarii Melnychuk",
    "label": "Lead Data & Applied AI Engineer",
    "summary": "Lead Data Engineer and Applied AI Engineer specializing in data-platform modernization, lakehouse architecture, and production agentic systems. Data Lead for a team of 6 engineers (grown from 2 through hands-on hiring) and lead of a 9-person cross-functional delivery team. A generalist who works primarily in Python and reads Scala, Go, and TypeScript, focused on architecture, performance, business correctness, and design elegance.",
    "url": "https://nmeln.com",
    "profiles": [
      {
        "network": "LinkedIn",
        "username": "nazarii-melnychuk-84581111b",
        "url": "https://www.linkedin.com/in/nazarii-melnychuk-84581111b"
      },
      {
        "network": "GitHub",
        "username": "nmeln",
        "url": "https://github.com/nmeln"
      },
      {
        "network": "Linktree",
        "username": "nmeln",
        "url": "https://linktr.ee/nmeln"
      }
    ]
  },
  "work": [
    {
      "name": "US adtech company",
      "position": "Data Platform Lead, Lakehouse & AI",
      "startDate": "2025-01",
      "endDate": "",
      "summary": "Lead the data platform and applied-AI initiatives for a US adtech company, owning lakehouse modernization, production reliability, and agentic AI systems while leading data engineering delivery.",
      "highlights": [
        "Spearheaded the end-to-end migration of a business-critical analytics platform from a legacy cloud warehouse and third-party analytical database to a Databricks Lakehouse, establishing a unified serving layer and removing vendor dependencies from the critical data path.",
        "Architected medallion-style data pipelines using Spark and Delta Lake: incremental ingestion, snapshot-consistent merges, granular fact models, pre-aggregations, and probabilistic counting for large-scale analytical workloads.",
        "Led controlled cutovers across data pipelines, backend APIs, frontend clients, and downstream services using automated source-versus-target parity testing and stable interface contracts; retired obsolete infrastructure and removed thousands of lines of legacy code.",
        "Delivered substantial efficiency improvements: 4–5× faster production processing, 100×+ acceleration in validated analytical prototypes, order-of-magnitude corrections to sizing logic, and recurring cloud-cost reductions.",
        "Restored correctness in complex measurement and attribution pipelines by resolving temporal-window, slowly-changing-dimension, canonicalization, deduplication, status-management, and aggregation defects.",
        "Led root-cause analysis and remediation of high-impact production incidents spanning schema inference, Unicode normalization, database connection lifecycle, distributed storage configuration, cache semantics, and accidental Cartesian joins.",
        "Built and launched an LLM-powered natural-language data discovery service from zero to production using FastAPI, agent frameworks, MCP tools, embeddings, and vector search over tens of thousands of domain attributes.",
        "Designed and productionized a Claude-powered autonomous incident-triage agent that performs permission-gated, read-only investigations, maintains an auditable activity trail, posts structured incident summaries, and opens draft documentation pull requests.",
        "Led the architecture (not implementation) of a resilient, self-learning agent-based LLM parser for adtech postlogs: scoped the stack, intermediate-result storage, off-the-shelf vs hosted OCR / bounding-box models (e.g., Datalab), clear responsibility separation from other agents in the flow, and an assessment of current SOTA approaches.",
        "Hardened agentic systems for production with structured-output validation, permission boundaries, bounded concurrency, token controls, observability, secrets management, container orchestration, and Git-based episodic memory.",
        "Applied Claude and Claude Code as engineering force multipliers for repository-scale analysis, migration planning, debugging, implementation, and documentation, backed by automated tests, data-parity checks, and human review.",
        "Automated several data-team and sprint/planning processes as reusable agent skills, converting runbooks into codified workflows with built-in confirmation steps and invariant checks."
      ]
    },
    {
      "name": "US SaaS company",
      "position": "Messaging Project",
      "startDate": "2021-10",
      "endDate": "2024-12",
      "summary": "Developed core components of omnichannel messaging platform, enabling enterprise customers to reach users across WhatsApp Business, RCS, and SMS channels through unified APIs.",
      "highlights": [
        "Implemented key parts of sender registration system supporting multiple messaging channels (WhatsApp, RCS and potentially others), handling provider-specific requirements and compliance rules.",
        "Optimized message delivery latency and reliability while maintaining complex business rules across different OTT providers.",
        "Resolved critical customer escalations through deep technical investigation and edge case analysis.",
        "Worked on updating billing logic on a critical path, ensuring accurate and timely billing for customers.",
        "Contributed to cross-team Scala, Golang and Java projects."
      ]
    },
    {
      "name": "US technology company",
      "position": "Marketing Project",
      "startDate": "2021-03",
      "endDate": "2021-10",
      "summary": "Developed and optimized Apache Spark pipelines processing cross-service engagement data with strict privacy preservation requirements across multiple digital entertainment and subscription platforms.",
      "highlights": [
        "Engineered high-performance Spark jobs processing TB-scale user engagement data.",
        "Built privacy-preserving data aggregation pipelines enabling anonymous cross-service analytics.",
        "Optimized data processing pipelines reducing job completion times while ensuring data minimization principles.",
        "Documented dataset lineage and data flow for compliance and reproducibility."
      ]
    },
    {
      "name": "US healthcare technology company",
      "position": "Healthcare Project",
      "startDate": "2020-05",
      "endDate": "2021-03",
      "summary": "Played key role in modernizing healthcare data processing platform, enabling efficient transformation of diverse medical records into analytics-ready formats for business intelligence.",
      "highlights": [
        "Transformed legacy Python batch jobs into scalable Apache Spark workflows, migrating complex healthcare data processing logic.",
        "Designed and implemented production-grade ETL pipelines handling diverse healthcare data formats from multiple source systems.",
        "Optimized large-scale data reprocessing jobs reducing execution time while ensuring HIPAA compliance.",
        "Developed automated AWS S3 to Redshift data pipeline using PySpark and boto3, enabling real-time BI reporting.",
        "Contributed significant technical input to architecture decisions affecting multiple project initiatives."
      ]
    },
    {
      "name": "Israel adtech company",
      "position": "Adtech Project",
      "startDate": "2019-10",
      "endDate": "2020-05",
      "summary": "Developed real-time ad analytics platform processing high-volume impression data (670+ MPS) to enable automated bidding decisions and campaign optimization.",
      "highlights": [
        "Implemented Spark Structured Streaming jobs for real-time ad performance analysis",
        "Optimized data processing architecture reducing operational costs while maintaining system reliability",
        "Modernized legacy Python ETL pipelines to improve maintainability and processing efficiency"
      ]
    },
    {
      "name": "US SaaS company",
      "position": "Communications Project",
      "startDate": "2018-02",
      "endDate": "2019-10",
      "summary": "Developed high-throughput streaming applications for SMS data processing, implementing complex rate calculation logic and generating business intelligence insights.",
      "highlights": [
        "Optimized messaging metadata enrichment pipeline during Kinesis-to-Kafka migration, achieving 830+ MPS through elimination of processing redundancies.",
        "Implemented comprehensive cross-stream validation to ensure data consistency between source systems during the transition.",
        "Built cost-effective internal services replacing external API dependencies, resulting in significant operational savings",
        "Led Scala knowledge-sharing initiatives including mentoring sessions and technical workshops"
      ]
    },
    {
      "name": "US energy company",
      "position": "Digital Transformation Project",
      "startDate": "2017-06",
      "endDate": "2017-12",
      "summary": "Contributed to enterprise-wide data modernization initiative, migrating traditional database workloads to cloud-based big data processing platform.",
      "highlights": [
        "Replaced legacy Oracle and MySQL batch processes with scalable Apache Spark pipelines",
        "Built new data processing workflows using Spark SQL and Hive, eliminating dependency on legacy SQL jobs"
      ]
    },
    {
      "name": "European food and beverage companies",
      "position": "IoT Monitoring Platform",
      "startDate": "2015-11",
      "endDate": "2017-06",
      "summary": "Developed real-time monitoring system processing data from IoT sensors across warehouse and retail locations, enabling predictive maintenance and inventory optimization.",
      "highlights": [
        "Implemented scalable data processing pipelines using Apache Spark and Akka Streams to handle real-time sensor data",
        "Built diagnostic tools enabling QA and hardware teams to validate device performance and data accuracy",
        "Developed anomaly detection system for early identification of hardware issues"
      ]
    }
  ],
  "education": [
    {
      "institution": "Lviv Polytechnic National University",
      "area": "Computer Science",
      "studyType": "MSc Degree",
      "startDate": "2016",
      "endDate": "2017",
      "location": "Ukraine"
    },
    {
      "studyType": "Course",
      "area": "Natural Language Processing & AI",
      "startDate": "2023",
      "endDate": "",
      "courses": [
        "Contributed Ukrainian localization and dataset improvements to OpenAssistant/oasst1 open-source project",
        "Built practical applications using transformer models and HuggingFace libraries",
        "Explored large language models and their enterprise applications"
      ]
    },
    {
      "studyType": "Course",
      "area": "Deep Learning & Time Series Analysis",
      "startDate": "2022",
      "endDate": "",
      "courses": [
        "Completed fast.ai's Practical Deep Learning for Coders course",
        "Implemented time-series forecasting solutions using Facebook's Prophet",
        "Applied deep learning techniques to real-world data problems"
      ]
    }
  ],
  "skills": [
    {
      "name": "Languages",
      "keywords": [
        "Python (primary)",
        "Scala",
        "Go",
        "TypeScript"
      ]
    },
    {
      "name": "Data & Lakehouse",
      "keywords": [
        "Databricks",
        "Delta Lake",
        "Apache Spark",
        "Apache Kafka",
        "Airflow"
      ]
    },
    {
      "name": "Applied AI",
      "keywords": [
        "LLMs",
        "Claude / Claude Code",
        "MCP",
        "FastMCP",
        "Embeddings",
        "Vector search",
        "FastAPI"
      ]
    },
    {
      "name": "Agent SDKs",
      "keywords": [
        "OpenAI Agents SDK",
        "Claude Agent SDK",
        "Inngest AgentKit"
      ]
    },
    {
      "name": "Data Warehousing & Analytics",
      "keywords": [
        "Amazon Redshift",
        "BigQuery",
        "Amazon Athena",
        "ElasticSearch",
        "pandas"
      ]
    },
    {
      "name": "Databases",
      "keywords": [
        "PostgreSQL",
        "Amazon RDS",
        "ElastiCache: Redis / Valkey"
      ]
    },
    {
      "name": "Cloud & Infrastructure",
      "keywords": [
        "AWS (EMR, Lambda, SQS, Aurora)",
        "Docker",
        "K8S",
        "Datadog"
      ]
    }
  ],
  "languages": [
    {
      "language": "English",
      "fluency": "Advanced"
    }
  ],
  "projects": [
    {
      "name": "real-time FTMS logging and workout tracker for my air bike",
      "description": "A real-time FTMS logging and workout tracker for my air bike, with heart-rate and cadence support and data export."
    },
    {
      "name": "high-performance 180° and 360° panorama and stereo-image viewer for the Meta Quest VR headset",
      "description": "A high-performance 180° and 360° panorama and stereo-image viewer for the Meta Quest VR headset, with mipmap support and low latency."
    },
    {
      "name": "Automation of personal workflows with a Nous Hermes agent",
      "description": "Automation of personal workflows with a Nous Hermes agent, through custom-built skills and purpose-built mini-apps."
    }
  ],
  "meta": {
    "canonical": "https://nmeln.com/resume.json",
    "lastModified": "2026-06-21T16:57:10.172Z"
  }
}