{"version":"0.1","company":{"name":"YubHub","url":"https://yubhub.co","jobsUrl":"https://yubhub.co/jobs/skill/semantic-search"},"x-facet":{"type":"skill","slug":"semantic-search","display":"Semantic Search","count":5},"x-feed-size-limit":100,"x-feed-sort":"enriched_at desc","x-feed-notice":"This feed contains at most 100 jobs (the most recently enriched). For the full corpus, use the paginated /stats/by-facet endpoint or /search.","x-generator":"yubhub-xml-generator","x-rights":"Free to redistribute with attribution: \"Data by YubHub (https://yubhub.co)\"","x-schema":"Each entry in `jobs` follows https://schema.org/JobPosting. YubHub-native raw fields carry `x-` prefix.","jobs":[{"@context":"https://schema.org","@type":"JobPosting","identifier":{"@type":"PropertyValue","name":"YubHub","value":"job_3e231b3e-949"},"title":"Forward Deployed AI Engineering Manager, Enterprise","description":"<p>As a Forward Deployed AI Engineering Manager on our Enterprise team, you&#39;ll be the technical bridge between Scale AI&#39;s cutting-edge AI capabilities and our most strategic customers.</p>\n<p>You&#39;ll work with enterprise clients to understand their unique challenges, lead a team that architects specific AI solutions, and ensure successful deployment and adoption of AI systems in production environments.</p>\n<p>This is a Management role that combines deep engineering and AI expertise, leading a team, and working on customer-facing problems. You&#39;ll work directly with customer engineering teams to integrate AI into their critical workflows.</p>\n<p><strong>Customer Integration &amp; Deployment</strong></p>\n<p>Partner directly with enterprise customers to understand their technical infrastructure, data pipelines, and business requirements.</p>\n<p>Design and implement custom integrations between Scale AI&#39;s platform and customer data environments (cloud platforms, data warehouses, internal APIs).</p>\n<p>Build robust data connectors and ETL pipelines to ingest, process, and prepare customer data for AI workflows.</p>\n<p>Deploy and configure AI models and agents within customer security and compliance boundaries.</p>\n<p><strong>AI Agent Development</strong></p>\n<p>Develop production-grade AI agents tailored to customer use cases across domains like customer support, data analysis, content generation, and workflow automation.</p>\n<p>Architect multi-agent systems that orchestrate between different models, tools, and data sources.</p>\n<p>Implement evaluation frameworks to measure agent performance and iterate toward business objectives.</p>\n<p>Design human-in-the-loop workflows and feedback mechanisms for continuous agent improvement.</p>\n<p><strong>Prompt Engineering &amp; Optimization</strong></p>\n<p>Create sophisticated prompt engineering strategies optimized for customer-specific domains and data.</p>\n<p>Build and maintain prompt libraries, templates, and best practices for customer use cases.</p>\n<p>Conduct systematic prompt experimentation and A/B testing to improve model outputs.</p>\n<p>Implement RAG (Retrieval Augmented Generation) systems and fine-tuning pipelines where appropriate.</p>\n<p><strong>Leadership &amp; Collaboration</strong></p>\n<p>Serve as the Engineering Manager and technical point of contact for strategic enterprise accounts.</p>\n<p>Lead a team that is collaborating with customer data scientists, ML engineers, and software developers to ensure smooth integration.</p>\n<p>Work closely with Scale&#39;s product and engineering teams to translate customer needs into product improvements.</p>\n<p>Document technical architectures, integration patterns, and best practices.</p>\n<p><strong>Problem Solving &amp; Innovation</strong></p>\n<p>Debug complex technical issues across the entire stack, from data pipelines to model outputs.</p>\n<p>Rapidly prototype solutions to unblock customers and prove out new use cases.</p>\n<p>Stay current on the latest AI/ML research and tools, bringing innovative approaches to customer problems.</p>\n<p>Identify opportunities for productization based on common customer patterns.</p>\n<p style=\"margin-top:24px;font-size:13px;color:#666;\">XML job scraping automation by <a href=\"https://yubhub.co\">YubHub</a></p>","url":"https://yubhub.co/jobs/job_3e231b3e-949","directApply":true,"hiringOrganization":{"@type":"Organization","name":"Scale AI","sameAs":"https://scale.com/","logo":"https://logos.yubhub.co/scale.com.png"},"x-apply-url":"https://job-boards.greenhouse.io/scaleai/jobs/4602177005","x-work-arrangement":"hybrid","x-experience-level":"executive","x-job-type":"full-time","x-salary-range":"$216,000-$270,000 USD","x-skills-required":["Python","Production","Data Structures","Algorithms","System Design","Cloud Platforms","Modern Data Infrastructure","Problem-Solving","Communication"],"x-skills-preferred":["LLMs","Prompting Techniques","Embeddings","RAG Architectures","Vector Databases","Semantic Search Systems","Containerization","CI/CD Pipelines","Terraform","Bicep","Infrastructure as Code"],"datePosted":"2026-04-18T15:56:13.908Z","jobLocation":{"@type":"Place","address":{"@type":"PostalAddress","addressLocality":"San Francisco, CA; New York, NY"}},"employmentType":"FULL_TIME","occupationalCategory":"Engineering","industry":"Technology","skills":"Python, Production, Data Structures, Algorithms, System Design, Cloud Platforms, Modern Data Infrastructure, Problem-Solving, Communication, LLMs, Prompting Techniques, Embeddings, RAG Architectures, Vector Databases, Semantic Search Systems, Containerization, CI/CD Pipelines, Terraform, Bicep, Infrastructure as Code","baseSalary":{"@type":"MonetaryAmount","currency":"USD","value":{"@type":"QuantitativeValue","minValue":216000,"maxValue":270000,"unitText":"YEAR"}}},{"@context":"https://schema.org","@type":"JobPosting","identifier":{"@type":"PropertyValue","name":"YubHub","value":"job_77ff2013-8f9"},"title":"Senior Product Manager, Context Engineering","description":"<p>ZoomInfo is where careers accelerate. We move fast, think boldly, and empower you to do the best work of your life. As a Senior Product Manager, Context Engineering, you&#39;ll be surrounded by teammates who care deeply, challenge each other, and celebrate wins.</p>\n<p>With tools that amplify your impact and a culture that backs your ambition, you won&#39;t just contribute. You&#39;ll make things happen–fast.</p>\n<p><strong>The Opportunity:</strong></p>\n<p>ZoomInfo built the industry&#39;s most sophisticated GTM data acquisition infrastructure. Now we&#39;re applying that same rigor to context engineering,the emerging discipline that determines whether AI systems deliver transformative value or incremental improvement.</p>\n<p>This role architects the context layer powering our AI intelligence across Copilot, GTM Studio, and MarketingOS. You&#39;ll transform how ZoomInfo&#39;s agentic workflows access, compress, and deliver precisely the right information at exactly the right moment.</p>\n<p>The impact is organization-wide: every AI interaction, every intelligent recommendation, every autonomous agent action depends on the context infrastructure you’ll build.</p>\n<p>We&#39;ve transitioned to AI-first product thinking company-wide. The context pipelines exist but remain nascent,creating a rare opportunity to define architectural patterns and platform standards that compound value across multiple product teams in the years to come.</p>\n<p><strong>What You&#39;ll Do:</strong></p>\n<p>Architect Context Acquisition Pipelines</p>\n<p>Design and optimize how ZoomInfo retrieves, transforms, and delivers context from our semantic data layer, memory systems, and data producers. You&#39;ll balance retrieval quality against latency and cost constraints, implementing hybrid search strategies, intelligent caching, and context compression techniques that maintain information density while respecting token budgets.</p>\n<p>Own the Context Layer Platform</p>\n<p>Build infrastructure serving multiple product teams,Copilot, GTM Studio, MarketingOS,as internal customers. Establish API contracts, developer experience standards, and integration patterns that accelerate feature velocity.</p>\n<p>Maintain the delicate balance between providing flexible building blocks and opinionated solutions that encode best practices.</p>\n<p>Drive Quality Through Measurement</p>\n<p>Implement evaluation frameworks using RAGAS metrics and custom benchmarks. Monitor retrieval precision, context relevance, hallucination rates, and system performance in production.</p>\n<p>Translate quality signals into architectural improvements, working closely with ML engineers to iterate on embedding models, reranking strategies, and retrieval algorithms.</p>\n<p>Navigate Emerging Research</p>\n<p>Context engineering evolves weekly. You&#39;ll continuously evaluate innovations,GraphRAG for multi-hop reasoning, test-time compute scaling, multimodal retrieval, compression techniques,determining which advances warrant production investment versus which remain academic curiosities.</p>\n<p>Bring external best practices to ZoomInfo while contributing learnings back to the broader community.</p>\n<p>Orchestrate Cross-Functional Execution</p>\n<p>Translate between three distinct worlds: ML engineers optimizing retrieval algorithms, platform engineers building scalable infrastructure, and product teams shipping customer features.</p>\n<p>Establish communication cadences, prioritization frameworks, and decision-making processes that balance urgent requests against strategic platform development.</p>\n<p><strong>What You’ll Bring:</strong></p>\n<ul>\n<li>4-6 years of product management experience with 2+ years in ML/AI infrastructure</li>\n</ul>\n<ul>\n<li>Direct experience with production RAG systems, vector databases, or semantic search, context management</li>\n</ul>\n<ul>\n<li>Experience with graph databases (e.g. Neo4j)</li>\n</ul>\n<ul>\n<li>Track record building platform products serving multiple internal or external customers</li>\n</ul>\n<ul>\n<li>Familiarity with context compression, embedding models, and retrieval evaluation frameworks</li>\n</ul>\n<ul>\n<li>History of defining product vision in nascent technical domains where best practices are still emerging</li>\n</ul>\n<p><strong>Who You Are:</strong></p>\n<p>Technical Foundation</p>\n<p>Expert-level understanding of RAG system architecture,you can discuss embedding dimensionality trade-offs, vector database indexing strategies, and reranking approaches with depth.</p>\n<p>You&#39;ve built or significantly contributed to production retrieval systems, not just managed them at arm&#39;s length.</p>\n<p>Python and SQL proficiency enables you to review code, analyze retrieval issues, and prototype solutions for concept validation.</p>\n<p>Platform Product Mindset</p>\n<p>Experience building infrastructure products where internal engineering teams are your customers.</p>\n<p>You measure success through downstream product velocity improvements and developer satisfaction scores, not just uptime metrics.</p>\n<p>You understand platform economics,how each additional team using your infrastructure increases its value through shared learnings and amortized costs.</p>\n<p>Intellectual Velocity</p>\n<p>You read recent research papers from arXiv, ACL, NeurIPS.</p>\n<p>You prototype emerging techniques to understand their practical constraints.</p>\n<p>You maintain strong opinions weakly held, updating your architectural assumptions as evidence accumulates.</p>\n<p>The discipline moves too fast for static expertise,continuous learning is non-negotiable.</p>\n<p>Strategic Communication</p>\n<p>You translate between technical depth and business impact fluently.</p>\n<p>You can explain to executives why implementing GraphRAG takes 6 months but unlocks $10M in product capabilities.</p>\n<p>You can communicate to engineers why business constraints require shipping &#39;good enough&#39; in 3 weeks rather than &#39;optimal&#39; in 3 months.</p>\n<p>You influence without formal authority through data, clear reasoning, and earned credibility.</p>\n<p><strong>The Environment:</strong></p>\n<p>Reporting &amp; Collaboration</p>\n<p>Report to the Senior Product Director for Context Engineering, Semantic Data Layer, and Agentic Memory within ZoomInfo&#39;s Intelligence team.</p>\n<p>Work alongside PMs responsible for signals and ML scoring/recommendation models.</p>\n<p>Together, you ensure our agentic workflows fill context windows with high-quality, information-dense content exactly when needed.</p>\n<p>Pace &amp; Problems</p>\n<p>Fast-moving engineering team that understands the space.</p>\n<p>Company-wide AI adoption push creates both urgency and opportunity.</p>\n<p>Expect interesting problems: How do we maintain sub-200ms retrieval latency at scale?</p>\n<p>When does GraphRAG justify its indexing cost?</p>\n<p>How do we balance context freshness with cache efficiency?</p>\n<p>You&#39;ll shape answers that become architectural patterns across the organization.</p>\n<p>Impact</p>\n<p>Define a nascent discipline at a company that&#39;s already AI-first in product thinking and organizational structure.</p>\n<p>Your architectural decisions compound,every improvement to context quality multiplies across Copilot, GTM Studio, MarketingOS, and future products we haven&#39;t imagined yet.</p>\n<p>This is infrastructure work with direct line-of-sight to customer value.</p>\n<p>#LI-PS1 #LI-remote</p>\n<p style=\"margin-top:24px;font-size:13px;color:#666;\">XML job scraping automation by <a href=\"https://yubhub.co\">YubHub</a></p>","url":"https://yubhub.co/jobs/job_77ff2013-8f9","directApply":true,"hiringOrganization":{"@type":"Organization","name":"ZoomInfo","sameAs":"https://www.zoominfo.com/","logo":"https://logos.yubhub.co/zoominfo.com.png"},"x-apply-url":"https://job-boards.greenhouse.io/zoominfo/jobs/8206116002","x-work-arrangement":"remote","x-experience-level":"senior","x-job-type":"full-time","x-salary-range":"$89,200-$133,800 USD","x-skills-required":["Product Management","ML/AI Infrastructure","RAG Systems","Vector Databases","Semantic Search","Context Management","Graph Databases","Context Compression","Embedding Models","Retrieval Evaluation Frameworks"],"x-skills-preferred":[],"datePosted":"2026-04-18T15:44:52.232Z","jobLocation":{"@type":"Place","address":{"@type":"PostalAddress","addressLocality":"Waltham, Massachusetts, United States"}},"jobLocationType":"TELECOMMUTE","employmentType":"FULL_TIME","occupationalCategory":"Engineering","industry":"Technology","skills":"Product Management, ML/AI Infrastructure, RAG Systems, Vector Databases, Semantic Search, Context Management, Graph Databases, Context Compression, Embedding Models, Retrieval Evaluation Frameworks","baseSalary":{"@type":"MonetaryAmount","currency":"USD","value":{"@type":"QuantitativeValue","minValue":89200,"maxValue":133800,"unitText":"YEAR"}}},{"@context":"https://schema.org","@type":"JobPosting","identifier":{"@type":"PropertyValue","name":"YubHub","value":"job_4d14bef3-77e"},"title":"Staff Software Engineer - AI Applications","description":"<p>We believe that the way people interact with their finances will drastically improve in the next few years. We&#39;re dedicated to empowering this transformation by building the tools and experiences that thousands of developers use to create their own products. Plaid powers the tools millions of people rely on to live a healthier financial life.</p>\n<p>We work with thousands of companies like Venmo, SoFi, several of the Fortune 500, and many of the largest banks to make it easy for people to connect their financial accounts to the apps and services they want to use. Plaid&#39;s network covers 12,000 financial institutions across the US, Canada, UK and Europe.</p>\n<p>The AI Applications Team You will have the opportunity to join as one of the founding members of this newly formed team that is dedicated to consolidating and rapidly scaling our successful bets so far, and grow with the team in our quest to accelerate Plaid&#39;s transformation into an AI-first company.</p>\n<p>In this role you will lead projects that enable and scale our business with our largest AI customers and partners, starting with personal finance use cases and expanding into many others; examples include:</p>\n<ul>\n<li>Develop and evolve the preferred integration pattern for Plaid with AI providers - from API adaptations to building the official Plaid MCP Servers, and beyond</li>\n</ul>\n<ul>\n<li>Redefine how Plaid&#39;s consumer link experience embed into conversational interfaces in the most seamless way</li>\n</ul>\n<ul>\n<li>Architect the trust layer for the future of agentic commerce that will become the industry standard</li>\n</ul>\n<p>Additionally you will be expected to scale and extend our existing successful bets on AI-powered customer experience; examples include:</p>\n<ul>\n<li>Make the next step-function improvement in our homegrown customer support agent</li>\n</ul>\n<ul>\n<li>Land our multi-turn and multi-agent system that powers a truly delightful experience for our customers; define how to scalably run offline evaluation for complex multi-turn open-ended tasks; research and prototype how Human-In-The-Loop - Reinforcement Learning (RLHF) can power an insights flywheel; pioneer the architecture for customer-specific long-term memory, etc.</li>\n</ul>\n<ul>\n<li>Extend our agentic system to support other critical parts of the customer journey, starting with areas with the highest ROI - top-of-funnel product recommendation, customer onboarding and risk diligence, customer activation and assistance for faster productionization, as well as upselling and cross-selling of Plaid products</li>\n</ul>\n<p>You will have a front row seat to all the latest industry developments. Over time, with the skills and experience you develop and hone on this team, you can become an influential voice in defining where AI &lt; Fintech will be heading longer term.</p>\n<p><strong>Responsibilities</strong></p>\n<ul>\n<li>Build across the stack. Design, develop, and maintain scalable backend services and APIs, as well as intuitive, high-quality frontend applications that bring those systems to life.</li>\n</ul>\n<ul>\n<li>Work with other AI engineers, software engineers and machine learning engineers to architect, design and implement GenAI-powered products and features</li>\n</ul>\n<ul>\n<li>Collaborate across functions to understand user needs, propose and implement AI-powered solutions where they’re expected to have the highest impact</li>\n</ul>\n<ul>\n<li>Design and execute rapid experiments to push the boundaries on potential business impact from emerging AI capabilities, with a focus on minimal viable testing approaches</li>\n</ul>\n<ul>\n<li>Balance creative exploration of possibilities with rigorous evaluation of technical feasibility, product potential and business impact</li>\n</ul>\n<p><strong>Requirements</strong></p>\n<ul>\n<li>Experience building backend services and working with microservices or service-oriented architectures</li>\n</ul>\n<ul>\n<li>Strong working knowledge of HTML, CSS, JavaScript, and modern frontend frameworks or libraries, with comfort building user-facing experiences</li>\n</ul>\n<ul>\n<li>Hands-on experience working with LLMs to build products and shipping them to product with iterating with real user feedback - including but not limited to:</li>\n</ul>\n<ul>\n<li>Prompt engineering</li>\n</ul>\n<ul>\n<li>Fine-tuning</li>\n</ul>\n<ul>\n<li>Retrieval augmented generation (RAG)</li>\n</ul>\n<ul>\n<li>Semantic search</li>\n</ul>\n<ul>\n<li>Vector database and embedding models</li>\n</ul>\n<ul>\n<li>Agent orchestration framework</li>\n</ul>\n<ul>\n<li>Evaluation and monitoring framework of open-ended tasks</li>\n</ul>\n<ul>\n<li>Streaming and SSE</li>\n</ul>\n<ul>\n<li>Common UX and design patterns for GenAI-powered products</li>\n</ul>\n<ul>\n<li>Strong debugging and monitoring experience for production systems</li>\n</ul>\n<ul>\n<li>Ability to deeply understand customer and user needs through user research and rapid experimentation - be your own technical PM</li>\n</ul>\n<ul>\n<li>Ability to balance divergent thinking (exploring possibilities) with convergent thinking (evaluating feasibility), which is critical for driving 0 -&gt;1 projects</li>\n</ul>\n<ul>\n<li>Extremely curious and passionate about working in GenAI applications space</li>\n</ul>\n<p><strong>Nice-to-Haves</strong></p>\n<ul>\n<li>Experience training and/or serving ML models in production, or fine-tuning LLMs for domain-specific use cases</li>\n</ul>\n<ul>\n<li>Comfortable operating in privacy/PII-sensitive environments and applying compliance mitigations</li>\n</ul>\n<p style=\"margin-top:24px;font-size:13px;color:#666;\">XML job scraping automation by <a href=\"https://yubhub.co\">YubHub</a></p>","url":"https://yubhub.co/jobs/job_4d14bef3-77e","directApply":true,"hiringOrganization":{"@type":"Organization","name":"Plaid","sameAs":"https://plaid.com/","logo":"https://logos.yubhub.co/plaid.com.png"},"x-apply-url":"https://jobs.lever.co/plaid/a6bf6eeb-6486-4e45-a3b2-e712f32523d3","x-work-arrangement":"hybrid","x-experience-level":"staff","x-job-type":"full-time","x-salary-range":"$228,360-$369,800 per year","x-skills-required":["backend services","microservices","service-oriented architectures","HTML","CSS","JavaScript","modern frontend frameworks","LLMs","prompt engineering","fine-tuning","retrieval augmented generation","semantic search","vector database","embedding models","agent orchestration framework","evaluation and monitoring framework","streaming","SSE","UX and design patterns","debugging","monitoring"],"x-skills-preferred":[],"datePosted":"2026-04-17T12:55:58.129Z","jobLocation":{"@type":"Place","address":{"@type":"PostalAddress","addressLocality":"San Francisco"}},"employmentType":"FULL_TIME","occupationalCategory":"Engineering","industry":"Finance","skills":"backend services, microservices, service-oriented architectures, HTML, CSS, JavaScript, modern frontend frameworks, LLMs, prompt engineering, fine-tuning, retrieval augmented generation, semantic search, vector database, embedding models, agent orchestration framework, evaluation and monitoring framework, streaming, SSE, UX and design patterns, debugging, monitoring","baseSalary":{"@type":"MonetaryAmount","currency":"USD","value":{"@type":"QuantitativeValue","minValue":228360,"maxValue":369800,"unitText":"YEAR"}}},{"@context":"https://schema.org","@type":"JobPosting","identifier":{"@type":"PropertyValue","name":"YubHub","value":"job_7d9b8590-1c7"},"title":"Senior Software Engineer - AI Applications","description":"<p>We believe that the way people interact with their finances will drastically improve in the next few years. We&#39;re dedicated to empowering this transformation by building the tools and experiences that thousands of developers use to create their own products.</p>\n<p>Plaid powers the tools millions of people rely on to live a healthier financial life. We work with thousands of companies like Venmo, SoFi, several of the Fortune 500, and many of the largest banks to make it easy for people to connect their financial accounts to the apps and services they want to use.</p>\n<p><strong>Responsibilities</strong></p>\n<ul>\n<li>Build across the stack. Design, develop, and maintain scalable backend services and APIs, as well as intuitive, high-quality frontend applications that bring those systems to life.</li>\n<li>Work with other AI engineers, software engineers and machine learning engineers to architect, design and implement GenAI-powered products and features</li>\n<li>Collaborate across functions to understand user needs, propose and implement AI-powered solutions where they’re expected to have the highest impact</li>\n<li>Design and execute rapid experiments to push the boundaries on potential business impact from emerging AI capabilities, with a focus on minimal viable testing approaches</li>\n<li>Balance creative exploration of possibilities with rigorous evaluation of technical feasibility, product potential and business impact</li>\n</ul>\n<p><strong>Qualifications</strong></p>\n<ul>\n<li>Experience building backend services and working with microservices or service-oriented architectures</li>\n<li>Strong working knowledge of HTML, CSS, JavaScript, and modern frontend frameworks or libraries, with comfort building user-facing experiences</li>\n<li>Strong software engineering fundamentals, including system design and API development</li>\n<li>Hands-on experience building and shipping LLM-powered products, iterating with real user feedback</li>\n<li>Practical experience with prompt engineering, fine-tuning, RAG, semantic search (vector databases and embeddings), agent orchestration frameworks, and evaluation/monitoring of open-ended tasks</li>\n<li>Experience building GenAI-powered product experiences, including streaming/SSE and common UX patterns</li>\n<li>Strong debugging and production monitoring experience</li>\n<li>Ability to deeply understand customer needs through user research and rapid experimentation; comfortable operating as a technical PM when needed</li>\n<li>Ability to balance divergent exploration with pragmatic execution, especially in 0 to 1 environments</li>\n<li>Deep curiosity and passion for building GenAI applications</li>\n</ul>\n<p><strong>Nice to Have</strong></p>\n<ul>\n<li>Experience training and deploying ML models in production, including fine-tuning LLMs for domain-specific use cases</li>\n<li>Comfortable operating in privacy- and PII-sensitive environments, with experience applying appropriate compliance and data protection controls</li>\n</ul>\n<p style=\"margin-top:24px;font-size:13px;color:#666;\">XML job scraping automation by <a href=\"https://yubhub.co\">YubHub</a></p>","url":"https://yubhub.co/jobs/job_7d9b8590-1c7","directApply":true,"hiringOrganization":{"@type":"Organization","name":"Plaid","sameAs":"https://plaid.com/","logo":"https://logos.yubhub.co/plaid.com.png"},"x-apply-url":"https://jobs.lever.co/plaid/0afb2b7b-7e54-40e4-a8f6-642ac1df00f6","x-work-arrangement":"hybrid","x-experience-level":"senior","x-job-type":"full-time","x-salary-range":"$209,880-$315,480 per year","x-skills-required":["backend services","microservices","service-oriented architectures","HTML","CSS","JavaScript","modern frontend frameworks","LLM-powered products","prompt engineering","fine-tuning","RAG","semantic search","agent orchestration frameworks","evaluation/monitoring of open-ended tasks","GenAI-powered product experiences","streaming/SSE","common UX patterns","debugging","production monitoring"],"x-skills-preferred":[],"datePosted":"2026-04-17T12:51:25.836Z","jobLocation":{"@type":"Place","address":{"@type":"PostalAddress","addressLocality":"San Francisco"}},"employmentType":"FULL_TIME","occupationalCategory":"Engineering","industry":"Finance","skills":"backend services, microservices, service-oriented architectures, HTML, CSS, JavaScript, modern frontend frameworks, LLM-powered products, prompt engineering, fine-tuning, RAG, semantic search, agent orchestration frameworks, evaluation/monitoring of open-ended tasks, GenAI-powered product experiences, streaming/SSE, common UX patterns, debugging, production monitoring","baseSalary":{"@type":"MonetaryAmount","currency":"USD","value":{"@type":"QuantitativeValue","minValue":209880,"maxValue":315480,"unitText":"YEAR"}}},{"@context":"https://schema.org","@type":"JobPosting","identifier":{"@type":"PropertyValue","name":"YubHub","value":"job_62efca6f-b6f"},"title":"Senior AI Engineer","description":"<p>We&#39;re looking for a Senior AI Engineer who is obsessed with building AI systems that actually work in production: reliable, observable, cost-efficient, and genuinely useful. This is not a research role. You will ship AI-powered features that process real financial data for real businesses.</p>\n<p>LLM &amp; AI Pipeline Engineering - Design, build, and maintain production-grade LLM integration pipelines , including retrieval-augmented generation (RAG), prompt engineering, output parsing, and chain orchestration.</p>\n<p>Develop and operate AI features within Jeeves&#39;s core financial products: spend categorization, document extraction, anomaly detection, financial Q&amp;A, and automated reconciliation.</p>\n<p>Implement structured output validation, fallback handling, and confidence scoring to ensure AI decisions meet reliability standards for financial use cases.</p>\n<p>Evaluate and integrate AI frameworks and tools (LangChain, LlamaIndex, OpenAI API, Anthropic API, HuggingFace, vector databases) and advocate for the right tool for the job.</p>\n<p>Establish prompt versioning and evaluation practices to ensure AI outputs remain accurate and consistent as models and data evolve.</p>\n<p>Retrieval &amp; Vector Search - Design and maintain vector search pipelines using databases such as Pinecone, Weaviate, or pgvector to power semantic search and RAG-based features.</p>\n<p>Build document ingestion and chunking pipelines for Jeeves&#39;s financial data , processing invoices, receipts, policy documents, and transaction records.</p>\n<p>Optimize retrieval quality through embedding model selection, chunk strategy, metadata filtering, and re-ranking techniques.</p>\n<p>ML Model Serving &amp; Operations - Collaborate with data scientists to take trained ML models from experimental notebooks to production serving infrastructure.</p>\n<p>Build and maintain model serving endpoints with appropriate latency SLOs, input validation, and output monitoring.</p>\n<p>Implement model performance monitoring and data drift detection to ensure production models remain accurate over time.</p>\n<p>Support model retraining workflows by designing clean data pipelines and feature engineering that can be continuously updated.</p>\n<p>Backend Integration &amp; Reliability - Integrate AI services cleanly with Jeeves&#39;s backend microservices , designing clear API contracts, circuit breakers, and graceful degradation patterns.</p>\n<p>Write high-quality, testable backend code in Python or Go/Node.js to power AI-integrated features.</p>\n<p>Instrument AI components with structured logging, distributed tracing, latency dashboards, and alerting to ensure operational visibility.</p>\n<p>Collaboration &amp; Growth - Partner with Product, Backend Engineering, and Data Science to define the AI roadmap and translate requirements into reliable systems.</p>\n<p>Contribute to a culture of quality by writing design docs, reviewing peers&#39; AI system designs, and sharing learnings openly.</p>\n<p>Help grow the AI engineering practice at Jeeves by establishing patterns, tooling, and best practices that the broader team can build on.</p>\n<p style=\"margin-top:24px;font-size:13px;color:#666;\">XML job scraping automation by <a href=\"https://yubhub.co\">YubHub</a></p>","url":"https://yubhub.co/jobs/job_62efca6f-b6f","directApply":true,"hiringOrganization":{"@type":"Organization","name":"Jeeves","sameAs":"https://www.jeeves.com/","logo":"https://logos.yubhub.co/jeeves.com.png"},"x-apply-url":"https://jobs.lever.co/tryjeeves/ded9e04e-f18e-4d4c-ae43-4b7882c6200b","x-work-arrangement":"remote","x-experience-level":"senior","x-job-type":"full-time","x-salary-range":null,"x-skills-required":["LLM","AI","Python","LangChain","LlamaIndex","OpenAI API","Anthropic API","HuggingFace","vector databases","Pinecone","Weaviate","pgvector","semantic search","RAG-based features","document ingestion","chunking pipelines","embedding model selection","chunk strategy","metadata filtering","re-ranking techniques","model serving infrastructure","latency SLOs","input validation","output monitoring","model performance monitoring","data drift detection","clean data pipelines","feature engineering","API contracts","circuit breakers","graceful degradation patterns","structured logging","distributed tracing","latency dashboards","alerting"],"x-skills-preferred":[],"datePosted":"2026-04-17T12:39:23.341Z","jobLocation":{"@type":"Place","address":{"@type":"PostalAddress","addressLocality":"India"}},"jobLocationType":"TELECOMMUTE","employmentType":"FULL_TIME","occupationalCategory":"Engineering","industry":"Finance","skills":"LLM, AI, Python, LangChain, LlamaIndex, OpenAI API, Anthropic API, HuggingFace, vector databases, Pinecone, Weaviate, pgvector, semantic search, RAG-based features, document ingestion, chunking pipelines, embedding model selection, chunk strategy, metadata filtering, re-ranking techniques, model serving infrastructure, latency SLOs, input validation, output monitoring, model performance monitoring, data drift detection, clean data pipelines, feature engineering, API contracts, circuit breakers, graceful degradation patterns, structured logging, distributed tracing, latency dashboards, alerting"}]}