{"id":"2540100753","title":"Research Engineer – Training Infra","posted_at":"2026-05-11T16:48:36.000Z","apply_url":"https://job-boards.greenhouse.io/snorkelai/jobs/5825066004","locations":["Redwood City, CA","San Francisco, CA"],"employment_type":"full_time","workplace_type":"hybrid","seniority_level":null,"description_language":"en","source_name":"greenhouse","source_url":"https://job-boards.greenhouse.io/snorkelai/jobs/5825066004","salary":{"min":180000,"max":250000,"currency":"USD","period":"year","display":"$180,000–$250,000"},"job_summary":"Snorkel AI helps enterprises transform expert knowledge into specialized AI at scale. This Applied Research Engineer role involves building and operating GPU cluster infrastructure, training pipelines, and tooling to support model training and evaluation.","job_description":{"responsibilities":["Set up and manage GPU cluster infrastructure on major cloud providers.","Build and operate job orchestration and scheduling systems for training and evaluation jobs.","Integrate and maintain ML training frameworks and post-training pipelines.","Manage experiment tracking, dataset versioning, and model artifact management.","Monitor and optimize cluster health, resource utilization, and fault tolerance.","Collaborate with research scientists and ML engineers to unblock experiments and evolve infrastructure."],"minimum_qualifications":["Hands-on experience managing GPU clusters on major cloud providers.","Experience with distributed compute orchestration tools like Kubernetes or Slurm.","Working knowledge of distributed training concepts and parallelism strategies.","Experience with ML experiment tracking and data/model versioning tools.","Strong Python proficiency and solid software engineering fundamentals.","Ability to work in a fast-moving, iterative environment."],"preferred_qualifications":["Hands-on experience with post-training workflows such as SFT or RLHF."]},"visa_sponsorship":null,"experience_years_min":null,"job_address":null,"job_city":"Redwood City","job_state":"CA","job_country":"US","location_lat":37.487103999999995,"location_lng":-122.2344428,"keywords":["distributed training","production-ready","infrastructure","generative AI","communication","Collaborate","distributed","performance","fine-tuning","fast-moving","engineering","end-to-end","production","Kubernetes","automation","priorities","pipelines","workflows","business","research","dataset","design","Growth","Python","launch","teams","local","data","RLHF","SFT","GPU","AWS","ML","AI"],"company":{"name":"Snorkel AI","logo_url":"https://img.logo.dev/snorkel.ai?token=pk_fWx5G5QrQMm-0Ud8BW3mBg&size=64&format=png","description":"Snorkel AI provides an AI data development platform that enables enterprises to build and deploy custom machine learning and generative AI models by programmatically labeling and managing their data.","website_url":"https://snorkel.ai","linkedin_url":"https://www.linkedin.com/company/snorkel-ai","glassdoor_url":"https://www.glassdoor.com/Overview/Working-at-Snorkel-AI-EI_IE5809965.11,21.htm","x_url":"https://x.com/SnorkelAI","instagram_url":"https://www.instagram.com/snorkel_ai/","youtube_url":"https://www.youtube.com/@SnorkelAI","github_url":"https://github.com/snorkel-ai","huggingface_url":"https://huggingface.co/snorkelai","tiktok_url":null,"crunchbase_url":"https://www.crunchbase.com/organization/snorkel-ai","facebook_url":"https://www.facebook.com/snorkelai/","employee_count_range":"501-1000","employee_count":729,"founded_year":2019,"headquarters":{"address":"55 Perry St, Redwood City, CA 94063, United States","city":"Redwood City, CA","country":"US","lat":37.4863239,"lng":-122.232523},"industry":"other","company_type":"startup","total_funding_usd":238000000,"locations":["New York City, NY","New York, NY","Redwood City, CA","San Francisco, CA","Seattle, WA","Washington, DC"]},"structured_data":{"@context":"https://schema.org","@type":"JobPosting","@id":"https://curastem.org/jobs/2540100753#job","title":"Research Engineer – Training Infra","description":"Snorkel AI helps enterprises transform expert knowledge into specialized AI at scale. This Applied Research Engineer role involves building and operating GPU cluster infrastructure, training pipelines, and tooling to support model training and evaluation.","datePosted":"2026-05-11T16:48:36.000Z","validThrough":"2026-06-10T16:48:36.000Z","url":"https://curastem.org/jobs/2540100753","directApply":true,"hiringOrganization":{"@type":"Organization","name":"Snorkel AI","sameAs":"https://snorkel.ai","logo":"https://img.logo.dev/snorkel.ai?token=pk_fWx5G5QrQMm-0Ud8BW3mBg&size=64&format=png"},"jobLocation":{"@type":"Place","address":{"@type":"PostalAddress","streetAddress":"55 Perry St","addressLocality":"Redwood City","addressRegion":"CA","postalCode":"94063","addressCountry":"US"}},"employmentType":"FULL_TIME","identifier":{"@type":"PropertyValue","name":"Snorkel AI","value":"2540100753"},"baseSalary":{"@type":"MonetaryAmount","currency":"USD","value":{"@type":"QuantitativeValue","minValue":180000,"maxValue":250000,"unitText":"YEAR"}}}}