{"version":"0.1","company":{"name":"YubHub","url":"https://yubhub.co","jobsUrl":"https://yubhub.co/jobs/skill/bare-metal-infrastructure"},"x-facet":{"type":"skill","slug":"bare-metal-infrastructure","display":"Bare Metal Infrastructure","count":1},"x-feed-size-limit":100,"x-feed-sort":"enriched_at desc","x-feed-notice":"This feed contains at most 100 jobs (the most recently enriched). For the full corpus, use the paginated /stats/by-facet endpoint or /search.","x-generator":"yubhub-xml-generator","x-rights":"Free to redistribute with attribution: \"Data by YubHub (https://yubhub.co)\"","x-schema":"Each entry in `jobs` follows https://schema.org/JobPosting. YubHub-native raw fields carry `x-` prefix.","jobs":[{"@context":"https://schema.org","@type":"JobPosting","identifier":{"@type":"PropertyValue","name":"YubHub","value":"job_a2e88648-d1d"},"title":"Mistral Cloud - Site Reliability Engineer","description":"<p>We are seeking highly experienced Site Reliability Engineers (SRE) to shape the reliability, scalability and performance of our Cloud platform and customer facing applications.</p>\n<p>You will work closely with our software engineers and product teams to ensure our systems meet and exceed our internal and external customers&#39; expectations.</p>\n<p>Key responsibilities include:</p>\n<ul>\n<li>Design, build, and maintain scalable, highly available and fault-tolerant infrastructures</li>\n<li>Operate systems and troubleshoot issues in production environments</li>\n<li>Implement and improve monitoring, alerting, and incident response systems</li>\n<li>Implement and maintain workflows and tools for both our customer-facing APIs and large training runs</li>\n</ul>\n<p>Development responsibilities include:</p>\n<ul>\n<li>Drive continuous improvement in infrastructure automation, deployment, and orchestration</li>\n<li>Collaborate with software engineers to develop and implement solutions that enable safe and reproducible model-training experiments</li>\n<li>Help build a cloud platform offering an abstraction layer between science, engineering and infrastructure</li>\n<li>Design and develop new workflows and tooling to improve the reliability, availability and performance of our systems</li>\n</ul>\n<p>Additional responsibilities include:</p>\n<ul>\n<li>Collaborate with the security team to ensure infrastructure adheres to best security practices and compliance requirements</li>\n<li>Document processes and procedures to ensure consistency and knowledge sharing across the team</li>\n<li>Contribute to open-source projects, research publications, blog articles and conferences</li>\n</ul>\n<p>About you:</p>\n<ul>\n<li>Master’s degree in Computer Science, Engineering or a related field</li>\n<li>5+ years of experience in a DevOps/SRE role</li>\n<li>Strong experience with bare metal infrastructure and highly available distributed systems</li>\n<li>Exposure to site reliability issues in critical environments</li>\n<li>Experience working against reliability KPIs</li>\n<li>Hands-on experience with CI/CD, containerization and orchestration tools</li>\n<li>Knowledge of monitoring, logging, alerting and observability tools</li>\n<li>Familiarity with infrastructure-as-code tools</li>\n<li>Proficiency in scripting languages and knowledge of software development best practices</li>\n<li>Strong understanding of networking, security, and system administration concepts</li>\n<li>Excellent problem-solving and communication skills</li>\n</ul>\n<p>Your application will be all the more interesting if you also have:</p>\n<ul>\n<li>Experience in an AI/ML environment</li>\n<li>Experience of high-performance computing (HPC) systems and workload managers</li>\n<li>Worked with modern AI-oriented solutions</li>\n</ul>\n<p style=\"margin-top:24px;font-size:13px;color:#666;\">XML job scraping automation by <a href=\"https://yubhub.co\">YubHub</a></p>","url":"https://yubhub.co/jobs/job_a2e88648-d1d","directApply":true,"hiringOrganization":{"@type":"Organization","name":"Mistral AI","sameAs":"https://mistral.ai","logo":"https://logos.yubhub.co/mistral.ai.png"},"x-apply-url":"https://jobs.lever.co/mistral/f76907fd-428a-4824-a1cf-8013974fde29","x-work-arrangement":"remote","x-experience-level":"senior","x-job-type":"full-time","x-salary-range":null,"x-skills-required":["bare metal infrastructure","highly available distributed systems","CI/CD","containerization","orchestration tools","monitoring","logging","alerting","observability tools","infrastructure-as-code tools","scripting languages","software development best practices","networking","security","system administration"],"x-skills-preferred":["AI/ML environment","high-performance computing (HPC) systems","workload managers","modern AI-oriented solutions"],"datePosted":"2026-04-17T12:47:48.920Z","jobLocation":{"@type":"Place","address":{"@type":"PostalAddress","addressLocality":"Paris"}},"jobLocationType":"TELECOMMUTE","employmentType":"FULL_TIME","occupationalCategory":"Engineering","industry":"Technology","skills":"bare metal infrastructure, highly available distributed systems, CI/CD, containerization, orchestration tools, monitoring, logging, alerting, observability tools, infrastructure-as-code tools, scripting languages, software development best practices, networking, security, system administration, AI/ML environment, high-performance computing (HPC) systems, workload managers, modern AI-oriented solutions"}]}