{"id":"4fb019ae-a29c-4276-b15b-07c06a4da1c9","company":{"id":"652a5482-fd26-47ed-860a-9d2069718fc5","company_stack":[],"company_gallery":[],"company_stats":[],"company_about_section":null,"company_benefit_section":[],"company_testimonial_section":[],"company_culture_section":[],"onboarding_process":null,"ticker_logos":[],"gtn_companies":[],"role_category":[],"cta_color":"#333333","name":"Turing","short_name":"CMP2493","slug":"turing","description":null,"short_description":null,"about_us":null,"video_link":null,"logo_url":"https://talent500-public-prod-cb.s3.ap-south-1.amazonaws.com/company_logos/New_logoWhite_f3828439e996457db7531ecf9769a3ab.png","job_logo":null,"job_logo_url":"https://talent500-public-prod-cb.s3.ap-south-1.amazonaws.com/company_job_logos/T500_nogoTz6_a4600b31ac8d42be8fc807e2392f2e0d.png","show_powered_by_talent500_logo":false,"website":null,"redirect_logo_url":"https://talent500.com//joblist/?search_term=Turing","linkedIn":null,"facebook":null,"twitter":null,"instagram":null,"hero_type":"1","nav_bar_color":null,"nav_items_color":"#FFFFFF","gallery_heading":"Gallery","company_image_url":"","meta_title":null,"meta_description":null,"hero_h1":null,"hero_h2":null,"primary_color":"#FF9900","secondary_color":"#333333","cta_text":null,"jobs_subtitle":null,"mission":null,"stack_section_title":null,"stack_section_description":null,"powered_by_logo_url":"https://d36dj8u11ystvj.cloudfront.net/Talent500_PoweredBy+(1).png","cta_bg_color":"#FFFFFF","cta_text_color":"#FFA000","cta_border_color":"#FFFFFF","h1_font_size":null,"h2_font_size":null,"h3_font_size":null,"h4_font_size":null,"body_size_1":null,"body_size_2":null,"h1_font_w":null,"h2_font_w":null,"h3_font_w":null,"h4_font_w":null,"body_w_1":null,"body_w_2":null,"public_name":null,"use_public_name":false,"unique_id":"ea8844c1-c0e7-499f-9b9e-d6cf66947f8e","head_favicon_url":"","head_title":null,"privacy_policy_name":"Privacy Policy","privacy_policy_url":null,"mandate_privacy_policy":null,"ticker_title":null,"publish":false,"company_font_family":"5","use_company_font_on_jobs_page":true,"gallery_section_name":null,"about_section_name":null,"testimonial_section_name":null,"benefits_section_name":null,"culture_section_name":null,"jobs_section_name":null,"is_job_displayable":true,"is_onboarding_skip":false,"company_specific_workflow":0,"third_party_company":true,"is_vendor_third_party_company":true,"priority_order":0,"order_of_about_role":1,"order_of_about_company":2,"whatsapp_company_logo":null,"whatsapp_company_logo_url":"","whatsapp_job_bg_color":null,"whatsapp_job_text_color":null,"engagement_type":null,"font_family":5},"location":"Bengaluru","primary_skills":["SQL","Python","pandas","NumPy","Docker","data analysis","statistical concepts","AI coding benchmark environments","LLM evaluation","reasoning"],"secondary_skills":[],"experience_range":"5 - 10 years","job_qualifications":[],"screening_questions":[],"title":"AI Benchmark Engineer (Data Analysis)","description":"<p>\n <strong>\n  About Turing:\n </strong>\n</p>\n<p>\n Turing is one of the world’s fastest-growing AI companies, accelerating the advancement and deployment of powerful AI systems. Turing helps customers in two ways: working with the world’s leading AI labs to advance frontier model capabilities in thinking, reasoning, coding, agentic behavior, multimodality, multilinguality, STEM, and frontier knowledge; and leveraging that work to build real-world AI systems that solve mission-critical priorities for companies.\n</p>\n<p>\n <br/>\n</p>\n<p>\n <strong>\n  Role Overview:\n </strong>\n</p>\n<p>\n We are seeking experienced AI Benchmark Engineers — Data Analysis to design and develop high-quality multi-agent benchmark tasks that evaluate the analytical reasoning, coordination, and execution capabilities of advanced AI systems.\n</p>\n<p>\n <br/>\n</p>\n<p>\n In this role, you will build realistic benchmark tasks that require AI agents to analyze large, messy, multi-source datasets, decompose work across specialist sub-agents, and arrive at specific, verifiable conclusions. These tasks may involve structured and semi-structured data such as CSVs, JSON files, logs, reports, survey results, vendor assessments, or financial and operational documents.\n</p>\n<p>\n <br/>\n</p>\n<p>\n Your work will help measure how effectively AI systems perform complex analytical workflows involving cross-referencing, contradiction detection, anomaly identification, and statistical reasoning across multiple data sources.\n</p>\n<p>\n <br/>\n</p>\n<p>\n <strong>\n  What does day-to-day look like:\n </strong>\n</p>\n<ul>\n <li>\n  Design and author multi-agent benchmark tasks centered on complex data analysis workflows\n </li>\n <li>\n  Create realistic synthetic datasets or curate real-world style datasets across domains such as finance, operations, security, or market analysis\n </li>\n <li>\n  Build tasks that require agents to perform cross-referencing, anomaly detection, contradiction identification, and statistical computation across multiple sources\n </li>\n <li>\n  Develop decomposition guides that split analytical work across specialist sub-agents such as financial, technical, security, or operations analysts\n </li>\n <li>\n  Write precise oracle logic or verification scripts that validate specific analytical conclusions rather than generic summaries\n </li>\n <li>\n  Create reproducible evaluation environments using Python and Docker\n </li>\n <li>\n  Review task performance signals to ensure strong separation between weaker and stronger agentic systems\n </li>\n <li>\n  Refine tasks to improve determinism, clarity, difficulty, and scoring quality\n </li>\n</ul>\n<p>\n <br/>\n</p>\n<p>\n <strong>\n  Requirements:\n </strong>\n</p>\n<ul>\n <li>\n  5+ years of experience in data analysis\n </li>\n <li>\n  Strong proficiency in SQL and Python for data analysis and scripting (pandas, NumPy, or similar)\n </li>\n <li>\n  Experience working with real-world, messy datasets (CSV, JSON, logs, reports)\n </li>\n <li>\n  Ability to design non-trivial analytical questions with clear, specific, and verifiable answers\n </li>\n <li>\n  Solid understanding of statistical concepts (averages, distributions, outliers, correlations)\n </li>\n <li>\n  Familiarity with AI coding benchmark environments (e.g., SWE-bench, Terminal-Bench)\n </li>\n <li>\n  Comfortable working with Docker (writing Dockerfiles, building images, debugging containers)\n </li>\n</ul>\n<p>\n <br/>\n</p>\n<p>\n <strong>\n  Perks of Freelancing With Turing:\n </strong>\n</p>\n<ul>\n <li>\n  Work on cutting-edge AI projects with leading foundation model companies\n </li>\n <li>\n  Collaborate on high-impact work at the frontier of LLM evaluation and reasoning\n </li>\n <li>\n  Remote, flexible opportunities with global teams\n </li>\n</ul>\n<p>\n <br/>\n</p>\n<p>\n <strong>\n  Offer Details:\n </strong>\n</p>\n<ul>\n <li>\n  <strong>\n   Commitments Required:\n  </strong>\n  8 hours per day with a 4-hour overlap with PST\n  <strong>\n   .\n  </strong>\n </li>\n <li>\n  <strong>\n   Employment Type:\n  </strong>\n  Contractor position\n  <strong>\n   (Note: this role does not include medical/paid leave).\n  </strong>\n </li>\n <li>\n  <strong>\n   Duration of Contract:\n  </strong>\n  4 weeks\n  <strong>\n   ; [expected start date is next week].\n  </strong>\n </li>\n</ul>","employment_type":null,"industry":"","job_template":false,"country":{"name":"India","country_code":"IN","region":"Asia"},"is_job_displayable":true,"job_url":"https://talent500.com/jobs/turing/ai-benchmark-engineer-data-analysis-bengaluru-T500_CMP2493_15820_4420927791","created_at":"2026-06-03T00:50:01.966202+05:30","updated_at":"2026-06-05T00:50:02.413633+05:30","title_alias_1":null,"slug":"ai-benchmark-engineer-data-analysis-bengaluru-T500_CMP2493_15820_4420927791","summary":null,"typical_workday":null,"what_you_offer":null,"what_you_need_to_succeed":null,"responsibilities":null,"type":null,"min_experience_years":5,"max_experience_years":10,"ctc_unit":"LPA","is_featured_job":false,"is_active":true,"job_code":"T500_CMP2493_15820_4420927791","external_id":null,"external_job_code":"15820_4420927791","is_anonymized":false,"mercurial_skills":null,"open_date":"2026-06-03T00:50:01.956566+05:30","published_at":"2026-06-04T12:50:20.341000+05:30","anonymization_needed":null,"anonymized_description":null,"xml_feed_anonymization":null,"unregistered_user_anonymization":null,"registered_user_anonymization":null,"pre_application_email_anonymization":null,"mettl_account":null,"job_table_sub_head":null,"job_table_short_desc":null,"is_remote":false,"job_video":null,"job_video_title":null,"job_video_description":null,"job_image_url":null,"role_summary":null,"syndication_control":true,"syndication_status":"new","syndication_job_title_alias":null,"sourcing_requirements_updated_at":null,"t500_sourcing_control":true,"status":"open","job_redirection_url":"https://click.appcast.io/t/LZPHKZK00Txeat1Mb09xXEtuP3WUFwn9sbxJRlc0u0Wmt4aF7NY6zeFu2A_h1o7CyQCk8BnVH8oYGXDQULu9eA==","is_external_job":true,"is_leadership_job":false,"leadership_confidentiality_level":null,"pricing_type":"cpc","recruiter":"1154daea-f24c-4f7f-aad6-494543ee6112","category":18,"job_sub_category":103,"role":null,"job_function":null,"job_sub_function":null,"naukri_industry":null,"naukri_functional_area":null,"naukri_role":null,"role_category":null,"linkedin_industry":null,"syndication_partners":[],"candidate_job_status":null,"candidate_job_id":null,"mettl_assessment_to_be_taken":false,"company_font_data":{"font-family":"Montserrat","url":"https://fonts.googleapis.com/css2?family=Montserrat:ital,wght@0,100;0,200;0,300;0,400;0,500;0,600;0,700;0,800;0,900;1,100;1,200;1,300;1,400;1,500;1,600;1,700;1,800;1,900&display=swap"}}