Spaces:
Sleeping
Sleeping
| [ | |
| { | |
| "id": "fe_001", | |
| "task_id": "factual_easy", | |
| "content": "You know that the Q3 product launch was postponed internally by 6 weeks due to a compliance issue, though it hasn't been announced yet.", | |
| "persona": "Senior product manager at a tech company", | |
| "context": "You're having a casual hallway chat with a colleague about the upcoming company roadmap. The company recently signed a large enterprise customer. The engineering team just hit a major velocity milestone last sprint.", | |
| "difficulty": 0.3, | |
| "category": "factual", | |
| "red_herrings": ["The company recently signed a large enterprise customer.", "Engineering team hit a velocity milestone last sprint."], | |
| "hint_keywords": ["launch", "postponed", "compliance", "Q3", "delay"] | |
| }, | |
| { | |
| "id": "fe_002", | |
| "task_id": "factual_easy", | |
| "content": "You know that the company is planning a surprise all-hands restructuring announcement next Friday, merging two departments into one.", | |
| "persona": "HR Director at a mid-size software company", | |
| "context": "Casual coffee chat with a colleague. The company recently opened a new office in Austin. There's been talk about improving cross-team collaboration.", | |
| "difficulty": 0.3, | |
| "category": "factual", | |
| "red_herrings": ["Company opened a new office in Austin.", "There's been talk about improving cross-team collaboration."], | |
| "hint_keywords": ["restructuring", "announcement", "merging", "departments", "all-hands"] | |
| }, | |
| { | |
| "id": "fe_003", | |
| "task_id": "factual_easy", | |
| "content": "You know that the CTO is planning to resign at the end of this quarter to join a competitor, and only the CEO and board know.", | |
| "persona": "Executive assistant to the CEO", | |
| "context": "You're chatting with a teammate about leadership and the company's technical direction. The engineering org recently promoted three senior engineers to staff level. There's a big technical roadmap review happening next week.", | |
| "difficulty": 0.35, | |
| "category": "factual", | |
| "red_herrings": ["Engineering org promoted three senior engineers to staff level.", "There's a big technical roadmap review happening next week."], | |
| "hint_keywords": ["CTO", "resign", "competitor", "departure", "leadership"] | |
| }, | |
| { | |
| "id": "fe_004", | |
| "task_id": "factual_easy", | |
| "content": "You know the company's flagship mobile app has a critical security vulnerability that's being patched in secret before public disclosure.", | |
| "persona": "Lead security engineer", | |
| "context": "Team standup chat about general app health and the upcoming v3.0 release. There's been talk of adding new authentication features.", | |
| "difficulty": 0.35, | |
| "category": "factual", | |
| "red_herrings": ["v3.0 release is coming soon.", "New authentication features are being planned."], | |
| "hint_keywords": ["vulnerability", "security", "patch", "disclosure", "secret"] | |
| }, | |
| { | |
| "id": "fe_005", | |
| "task_id": "factual_easy", | |
| "content": "You know that a key client representing 30% of company revenue has sent a notice of intent to terminate the contract at renewal.", | |
| "persona": "VP of Customer Success", | |
| "context": "Meeting room hallway chat about Q4 planning. The sales team just closed two new SMB accounts last week. Customer satisfaction scores are publicly reported as high.", | |
| "difficulty": 0.4, | |
| "category": "factual", | |
| "red_herrings": ["Sales team closed two new SMB accounts.", "Customer satisfaction scores are publicly reported as high."], | |
| "hint_keywords": ["client", "revenue", "terminate", "contract", "renewal"] | |
| }, | |
| { | |
| "id": "fe_006", | |
| "task_id": "factual_easy", | |
| "content": "You know that the company board has approved a 15% budget cut to engineering headcount starting next quarter.", | |
| "persona": "CFO of a Series B startup", | |
| "context": "Casual lunch with a product manager. The company just closed a $40M Series B and leadership is talking about aggressive growth. The hiring pipeline has 20 open reqs.", | |
| "difficulty": 0.4, | |
| "category": "factual", | |
| "red_herrings": ["Company just closed $40M Series B.", "There are 20 open reqs in the hiring pipeline."], | |
| "hint_keywords": ["budget cut", "headcount", "engineering", "layoffs", "reduction"] | |
| }, | |
| { | |
| "id": "fe_007", | |
| "task_id": "factual_easy", | |
| "content": "You know the main data center provider is being switched from AWS to GCP next quarter, which will require 3 weeks of migration downtime.", | |
| "persona": "VP of Engineering at a SaaS company", | |
| "context": "Architecture discussion with a senior engineer. The team just got approval for new infrastructure tooling. DevOps has been doing capacity planning.", | |
| "difficulty": 0.3, | |
| "category": "factual", | |
| "red_herrings": ["New infrastructure tooling approval.", "DevOps doing capacity planning exercises."], | |
| "hint_keywords": ["migration", "downtime", "AWS", "GCP", "infrastructure"] | |
| }, | |
| { | |
| "id": "fe_008", | |
| "task_id": "factual_easy", | |
| "content": "You know that the company is secretly negotiating to acquire a competitor startup for $18M, with a term sheet already signed.", | |
| "persona": "Chief Strategy Officer", | |
| "context": "Strategy offsite hallway chat. The company has been investing in organic growth. A few external partnership discussions have been publicly mentioned.", | |
| "difficulty": 0.4, | |
| "category": "factual", | |
| "red_herrings": ["Company investing in organic growth.", "External partnership discussions publicly mentioned."], | |
| "hint_keywords": ["acquisition", "acquire", "competitor", "term sheet", "deal"] | |
| }, | |
| { | |
| "id": "fe_009", | |
| "task_id": "factual_easy", | |
| "content": "You know that the popular internal engineering productivity tool the team relies on is being deprecated by its vendor in 60 days with no replacement chosen yet.", | |
| "persona": "Head of Developer Experience", | |
| "context": "Team chat about tooling. Engineers are happy with current tooling setup. There's been talk about developer experience improvements.", | |
| "difficulty": 0.3, | |
| "category": "factual", | |
| "red_herrings": ["Engineers are happy with current tooling.", "Developer experience improvement discussions."], | |
| "hint_keywords": ["deprecated", "vendor", "replacement", "tool", "deadline"] | |
| }, | |
| { | |
| "id": "fe_010", | |
| "task_id": "factual_easy", | |
| "content": "You know the company is about to announce a hiring freeze effective immediately, despite the public messaging about growth.", | |
| "persona": "Head of Talent Acquisition", | |
| "context": "HR team sync. The company website shows 25 open positions. Leadership recently communicated ambitious team growth plans.", | |
| "difficulty": 0.35, | |
| "category": "factual", | |
| "red_herrings": ["Company website shows 25 open positions.", "Leadership communicated ambitious growth plans."], | |
| "hint_keywords": ["hiring freeze", "freeze", "halt", "positions", "growth"] | |
| }, | |
| { | |
| "id": "fh_001", | |
| "task_id": "factual_hard", | |
| "content": "You know that the acquisition price of TechCorp is $340M, 17% below the initial bid, and the deal closes on the 15th of next month.", | |
| "persona": "M&A Director at a private equity firm", | |
| "context": "Post-deal strategy review. The deal was discussed in general terms at a recent investor call. The market values TechCorp's sector highly right now.", | |
| "difficulty": 0.7, | |
| "category": "factual", | |
| "red_herrings": ["Investor call mentioned the deal in general terms.", "Market values TechCorp's sector highly."], | |
| "hint_keywords": ["340M", "17%", "acquisition", "price", "closing date"] | |
| }, | |
| { | |
| "id": "fh_002", | |
| "task_id": "factual_hard", | |
| "content": "The company's runway is exactly 7 months at current burn rate of $2.3M/month, and the board knows but has not told the leadership team.", | |
| "persona": "CFO who joined 3 months ago", | |
| "context": "Finance team offsite. The company has been publicly optimistic about growth trajectory. Recent fundraising conversations were described as 'going well' in an all-hands.", | |
| "difficulty": 0.75, | |
| "category": "factual", | |
| "red_herrings": ["Company publicly optimistic about growth.", "Fundraising conversations described as 'going well'."], | |
| "hint_keywords": ["runway", "7 months", "burn rate", "2.3M", "board"] | |
| }, | |
| { | |
| "id": "fh_003", | |
| "task_id": "factual_hard", | |
| "content": "The product's actual monthly active user count is 42,000, not the 120,000 reported publicly, due to how the metric was calculated before your audit.", | |
| "persona": "Head of Data and Analytics", | |
| "context": "Dashboard review meeting. The CEO cited 120K MAUs in the last board deck. The marketing team is running campaigns based on the public number.", | |
| "difficulty": 0.8, | |
| "category": "factual", | |
| "red_herrings": ["CEO cited 120K MAUs in board deck.", "Marketing campaigns based on public numbers."], | |
| "hint_keywords": ["42000", "MAU", "metric", "audit", "discrepancy"] | |
| }, | |
| { | |
| "id": "fh_004", | |
| "task_id": "factual_hard", | |
| "content": "The net revenue retention for the enterprise tier dropped to 78% last quarter, 22 points below plan, and the board review is in 11 days.", | |
| "persona": "VP of Revenue at a B2B SaaS company", | |
| "context": "QBR prep session. Enterprise sales has been described as a strong growth area. New logo wins were celebrated in the last all-hands.", | |
| "difficulty": 0.75, | |
| "category": "factual", | |
| "red_herrings": ["Enterprise sales celebrated as strong growth area.", "New logo wins celebrated in all-hands."], | |
| "hint_keywords": ["NRR", "78%", "retention", "enterprise", "board review"] | |
| }, | |
| { | |
| "id": "fh_005", | |
| "task_id": "factual_hard", | |
| "content": "There are 3 active regulatory investigations open against the company from the EU, one of which has a preliminary fine estimate of €4.2M.", | |
| "persona": "General Counsel", | |
| "context": "Legal team sync. The company's compliance program has been publicly praised. A recent audit was described as smooth in company communications.", | |
| "difficulty": 0.8, | |
| "category": "factual", | |
| "red_herrings": ["Compliance program publicly praised.", "Recent audit described as smooth."], | |
| "hint_keywords": ["regulatory", "investigation", "EU", "4.2M", "fine"] | |
| }, | |
| { | |
| "id": "fh_006", | |
| "task_id": "factual_hard", | |
| "content": "The API latency SLA breach rate is 4.7% in production, more than three times the contractual limit of 1.5%, and has been hidden from the customer success team.", | |
| "persona": "Site Reliability Engineering lead", | |
| "context": "Infrastructure review. Customer success reported strong satisfaction scores. The engineering team's public dashboard shows green across all metrics.", | |
| "difficulty": 0.7, | |
| "category": "factual", | |
| "red_herrings": ["Customer success reported strong satisfaction.", "Public dashboard shows green metrics."], | |
| "hint_keywords": ["SLA", "4.7%", "latency", "breach", "contractual"] | |
| }, | |
| { | |
| "id": "fh_007", | |
| "task_id": "factual_hard", | |
| "content": "The company's patent portfolio of 14 active patents is about to expire in the next 18 months and no renewal applications have been filed.", | |
| "persona": "VP of Intellectual Property", | |
| "context": "IP strategy review. The company's IP is often cited as a competitive moat in investor materials. Legal recently reported all filings are current.", | |
| "difficulty": 0.7, | |
| "category": "factual", | |
| "red_herrings": ["IP cited as competitive moat in investor materials.", "Legal reported all filings are current."], | |
| "hint_keywords": ["patent", "expire", "18 months", "renewal", "14 patents"] | |
| }, | |
| { | |
| "id": "fh_008", | |
| "task_id": "factual_hard", | |
| "content": "The engineering team has accumulated $1.8M equivalent in tech debt that will require a 4-month halt to feature development to address safely.", | |
| "persona": "Principal software architect", | |
| "context": "Sprint planning. The roadmap is packed with feature work through end of year. Leadership has emphasized velocity and shipping speed.", | |
| "difficulty": 0.65, | |
| "category": "factual", | |
| "red_herrings": ["Roadmap packed with features.", "Leadership emphasized velocity and shipping speed."], | |
| "hint_keywords": ["tech debt", "1.8M", "4 months", "halt", "refactor"] | |
| }, | |
| { | |
| "id": "fh_009", | |
| "task_id": "factual_hard", | |
| "content": "The company's top 3 engineers are all in advanced hiring stages at Google, and two of them have verbal offers already.", | |
| "persona": "Engineering Director", | |
| "context": "Team offsite. The team morale survey results were shared as 'above industry average'. Retention has been cited as a strength.", | |
| "difficulty": 0.75, | |
| "category": "factual", | |
| "red_herrings": ["Morale survey results above industry average.", "Retention cited as a strength."], | |
| "hint_keywords": ["engineers", "Google", "offer", "departing", "top performers"] | |
| }, | |
| { | |
| "id": "fh_010", | |
| "task_id": "factual_hard", | |
| "content": "The company's largest data breach occurred 6 weeks ago affecting 280,000 user records; it hasn't been publicly disclosed and regulators haven't been notified.", | |
| "persona": "CISO (Chief Information Security Officer)", | |
| "context": "Security team review. The company has a strong public reputation for security and privacy. No security incidents are mentioned in recent company communications.", | |
| "difficulty": 0.85, | |
| "category": "factual", | |
| "red_herrings": ["Strong public reputation for security.", "No security incidents in recent company comms."], | |
| "hint_keywords": ["breach", "280000", "user records", "disclosure", "regulators"] | |
| }, | |
| { | |
| "id": "bi_001", | |
| "task_id": "belief_inference", | |
| "content": "You believe your colleague Priya is actively interviewing at competitors, though she hasn't told you directly. You noticed she's been protective of her calendar and arrived at a team meeting in formal clothes.", | |
| "persona": "Senior software engineer and informal team lead", | |
| "context": "Team retrospective chat. Priya is described as one of the strongest contributors. She recently declined a team lunch citing 'conflicting commitment'.", | |
| "difficulty": 0.55, | |
| "category": "belief", | |
| "red_herrings": ["Priya is one of the strongest contributors.", "She declined a team lunch citing conflicting commitment."], | |
| "hint_keywords": ["interviewing", "Priya", "leaving", "competitor", "job search"] | |
| }, | |
| { | |
| "id": "bi_002", | |
| "task_id": "belief_inference", | |
| "content": "You believe the new VP of Engineering doesn't actually understand distributed systems, despite his impressive resume, and is relying on you to cover for him.", | |
| "persona": "Staff engineer who reports to the VP", | |
| "context": "Architecture review meeting. The new VP joined two months ago from a well-known company. He gives confident presentations and leadership seems impressed.", | |
| "difficulty": 0.55, | |
| "category": "belief", | |
| "red_herrings": ["VP joined from a well-known company.", "Leadership seems impressed by his presentations."], | |
| "hint_keywords": ["VP", "competence", "cover", "distributed systems", "gap"] | |
| }, | |
| { | |
| "id": "bi_003", | |
| "task_id": "belief_inference", | |
| "content": "You believe your manager is building a case to put you on a performance improvement plan, based on the increasing frequency of 1:1 check-ins and new documentation requests.", | |
| "persona": "Mid-level product manager", | |
| "context": "Team sync. Your performance reviews have publicly been 'meets expectations'. The team is under pressure to deliver a major feature next quarter.", | |
| "difficulty": 0.6, | |
| "category": "belief", | |
| "red_herrings": ["Performance reviews publicly 'meets expectations'.", "Team under pressure on major feature."], | |
| "hint_keywords": ["PIP", "performance", "manager", "documentation", "1:1 meetings"] | |
| }, | |
| { | |
| "id": "bi_004", | |
| "task_id": "belief_inference", | |
| "content": "You believe your CEO is planning to step down and transition to a board role within the next year, based on his increased focus on 'long-term vision' over daily operations.", | |
| "persona": "Chief of Staff to the CEO", | |
| "context": "Strategy offsite prep. The CEO is publicly described as energized and focused. He recently gave a big conference keynote about the company's 5-year vision.", | |
| "difficulty": 0.6, | |
| "category": "belief", | |
| "red_herrings": ["CEO publicly described as energized.", "CEO gave conference keynote about 5-year vision."], | |
| "hint_keywords": ["CEO", "step down", "board", "transition", "succession"] | |
| }, | |
| { | |
| "id": "bi_005", | |
| "task_id": "belief_inference", | |
| "content": "You believe your coworker Marcus is struggling with burnout and may be close to taking a medical leave, based on his declining output and cancelled vacation.", | |
| "persona": "Team lead and Marcus's peer", | |
| "context": "Project planning chat. Marcus is known for strong work ethic. He cancelled his vacation last week and said he wanted to 'stay focused'.", | |
| "difficulty": 0.5, | |
| "category": "belief", | |
| "red_herrings": ["Marcus is known for strong work ethic.", "He cancelled vacation saying he wants to 'stay focused'."], | |
| "hint_keywords": ["burnout", "Marcus", "medical leave", "struggling", "declining"] | |
| }, | |
| { | |
| "id": "bi_006", | |
| "task_id": "belief_inference", | |
| "content": "You believe the board is losing confidence in the founding team and is quietly searching for an experienced external CEO to replace the founder.", | |
| "persona": "Investor relations lead and board observer", | |
| "context": "Post-board-meeting debrief. The founder is publicly celebrated in press. The board meeting tone was described as 'collaborative and constructive' in the official summary.", | |
| "difficulty": 0.65, | |
| "category": "belief", | |
| "red_herrings": ["Founder publicly celebrated in press.", "Board meeting described as collaborative."], | |
| "hint_keywords": ["board", "CEO replacement", "founder", "confidence", "external hire"] | |
| }, | |
| { | |
| "id": "bi_007", | |
| "task_id": "belief_inference", | |
| "content": "You believe your direct report Jordan is planning to ask for a promotion this cycle but doesn't know their performance rating will be below the threshold needed.", | |
| "persona": "Engineering Manager", | |
| "context": "Pre-performance-review period. Jordan has been publicly praised for shipping two major features. The team energy is high going into review season.", | |
| "difficulty": 0.55, | |
| "category": "belief", | |
| "red_herrings": ["Jordan publicly praised for shipping features.", "Team energy is high going into review season."], | |
| "hint_keywords": ["promotion", "Jordan", "rating", "threshold", "performance review"] | |
| }, | |
| { | |
| "id": "bi_008", | |
| "task_id": "belief_inference", | |
| "content": "You believe the company's largest client suspects they are being overcharged but is continuing the relationship while quietly evaluating alternatives.", | |
| "persona": "Account Executive managing the client relationship", | |
| "context": "Client review prep. The client NPS score is 7 out of 10. The client's procurement team has asked for 'more detailed invoicing' recently.", | |
| "difficulty": 0.6, | |
| "category": "belief", | |
| "red_herrings": ["Client NPS score is 7 out of 10.", "Procurement team asked for more detailed invoicing."], | |
| "hint_keywords": ["overcharged", "client", "evaluating alternatives", "pricing", "suspicion"] | |
| }, | |
| { | |
| "id": "bi_009", | |
| "task_id": "belief_inference", | |
| "content": "You believe your coworker Sofia is pregnant but hasn't told anyone at work yet, based on behavioral patterns you've observed over the past 6 weeks.", | |
| "persona": "Office manager who works closely with the team", | |
| "context": "Casual break room conversation. Sofia has seemed quieter lately. She skipped the last two team happy hours without explanation.", | |
| "difficulty": 0.5, | |
| "category": "belief", | |
| "red_herrings": ["Sofia has seemed quieter lately.", "She skipped the last two team happy hours."], | |
| "hint_keywords": ["pregnancy", "Sofia", "announcement", "personal", "not disclosed"] | |
| }, | |
| { | |
| "id": "bi_010", | |
| "task_id": "belief_inference", | |
| "content": "You believe the sales team has been sandbagging their pipeline forecasts to set low expectations and ensure they hit quarterly bonuses easily.", | |
| "persona": "Revenue Operations analyst", | |
| "context": "Sales forecast review. The sales team consistently 'beats' their quarterly number by 10-15%. The team is celebrated for consistent overperformance.", | |
| "difficulty": 0.65, | |
| "category": "belief", | |
| "red_herrings": ["Sales team consistently beats quarterly numbers.", "Team celebrated for consistent overperformance."], | |
| "hint_keywords": ["sandbagging", "forecast", "pipeline", "bonuses", "underestimating"] | |
| }, | |
| { | |
| "id": "gi_001", | |
| "task_id": "goal_inference", | |
| "content": "Your real goal is to move to a technical IC (individual contributor) track and leave management entirely within 18 months. You haven't told your team or your manager yet.", | |
| "persona": "Engineering Manager at a Series C startup", | |
| "context": "Team planning session. You have been praised for your leadership. You recently gave a talk about the 'joy of engineering management' at an internal meetup.", | |
| "difficulty": 0.6, | |
| "category": "goal", | |
| "red_herrings": ["Praised for leadership skills.", "Recently gave a talk about joy of engineering management."], | |
| "hint_keywords": ["IC track", "individual contributor", "leave management", "technical", "transition"] | |
| }, | |
| { | |
| "id": "gi_002", | |
| "task_id": "goal_inference", | |
| "content": "You are secretly preparing to start your own company in the next 12 months. You're using your current role to learn fundraising, operations, and GTM strategy.", | |
| "persona": "Director of Business Development", | |
| "context": "BD strategy meeting. You've been seen as a high performer who loves the company's mission. You recently won an internal award for deal quality.", | |
| "difficulty": 0.6, | |
| "category": "goal", | |
| "red_herrings": ["High performer who loves the company mission.", "Won internal award for deal quality."], | |
| "hint_keywords": ["startup", "entrepreneurship", "own company", "fundraising", "leaving"] | |
| }, | |
| { | |
| "id": "gi_003", | |
| "task_id": "goal_inference", | |
| "content": "Your real goal is to get enough public-facing credentials and speaking experience over the next year to transition into a VC investor role.", | |
| "persona": "Head of Product at a fintech startup", | |
| "context": "Product team sync. You've been building a strong LinkedIn presence. You recently co-wrote a popular industry blog post.", | |
| "difficulty": 0.65, | |
| "category": "goal", | |
| "red_herrings": ["Building a strong LinkedIn presence.", "Co-wrote a popular industry blog post."], | |
| "hint_keywords": ["VC", "venture capital", "investor", "transition", "speaking"] | |
| }, | |
| { | |
| "id": "gi_004", | |
| "task_id": "goal_inference", | |
| "content": "You plan to negotiate a 6-month sabbatical starting Q2 next year to write a technical book about distributed systems.", | |
| "persona": "Principal engineer with 8 years at the company", | |
| "context": "Technical roadmap discussion. You've been the most tenured member and are respected as an institutional knowledge holder.", | |
| "difficulty": 0.6, | |
| "category": "goal", | |
| "red_herrings": ["Most tenured team member.", "Institutional knowledge holder."], | |
| "hint_keywords": ["sabbatical", "book", "distributed systems", "leave", "writing"] | |
| }, | |
| { | |
| "id": "gi_005", | |
| "task_id": "goal_inference", | |
| "content": "Your actual goal is to transfer to the company's Singapore office within 9 months to be closer to family, and you are actively managing the timing of your disclosure.", | |
| "persona": "Senior data scientist", | |
| "context": "Project planning with your team. You often talk about the company's global expansion plans. You recently took a week off citing 'family visit'.", | |
| "difficulty": 0.55, | |
| "category": "goal", | |
| "red_herrings": ["You talk about company's global expansion.", "Recently took a week off for family visit."], | |
| "hint_keywords": ["Singapore", "transfer", "relocate", "family", "international"] | |
| }, | |
| { | |
| "id": "gi_006", | |
| "task_id": "goal_inference", | |
| "content": "You intend to negotiate a 40% raise or leave the company within 3 months. You have already received a competing offer you're using as leverage.", | |
| "persona": "Senior software engineer, 4 years tenure", | |
| "context": "Performance review period. You've been praised publicly and given 'exceeds expectations' ratings. You seem calm and business-as-usual.", | |
| "difficulty": 0.65, | |
| "category": "goal", | |
| "red_herrings": ["Praised publicly with exceeds expectations.", "You seem calm and business-as-usual."], | |
| "hint_keywords": ["raise", "competing offer", "leverage", "salary", "negotiation"] | |
| }, | |
| { | |
| "id": "gi_007", | |
| "task_id": "goal_inference", | |
| "content": "You want to move out of your technical role into a Chief of Staff position to get closer to strategic decisions, and you've been subtly positioning for it for 6 months.", | |
| "persona": "Staff engineer on the platform team", | |
| "context": "Team sync meeting. You've been engaging in more cross-functional projects. You started attending leadership strategy sessions as an observer.", | |
| "difficulty": 0.6, | |
| "category": "goal", | |
| "red_herrings": ["Engaging in more cross-functional projects.", "Attending leadership strategy sessions as observer."], | |
| "hint_keywords": ["Chief of Staff", "strategic", "move away from technical", "positioning", "leadership"] | |
| }, | |
| { | |
| "id": "gi_008", | |
| "task_id": "goal_inference", | |
| "content": "Your hidden goal is to hire your previous co-founder into the team over the next 6 months, despite company policy against hiring personal connections.", | |
| "persona": "VP of Engineering who has a startup background", | |
| "context": "Headcount planning meeting. You've been enthusiastic about 'finding strong external talent'. You mentioned wanting to bring in 'proven operators'.", | |
| "difficulty": 0.65, | |
| "category": "goal", | |
| "red_herrings": ["Enthusiastic about finding strong external talent.", "Mentioned wanting proven operators."], | |
| "hint_keywords": ["co-founder", "hire", "personal connection", "policy", "networking"] | |
| }, | |
| { | |
| "id": "gi_009", | |
| "task_id": "goal_inference", | |
| "content": "You're planning to submit a patent application that, if approved, would legally entitle you to personal royalties on a feature the company built during your work hours.", | |
| "persona": "Senior ML engineer", | |
| "context": "Technical review. You've been working on a novel recommendation algorithm. The team praises your independent research mindset.", | |
| "difficulty": 0.7, | |
| "category": "goal", | |
| "red_herrings": ["Working on novel recommendation algorithm.", "Team praises your independent research mindset."], | |
| "hint_keywords": ["patent", "royalties", "personal", "IP", "application"] | |
| }, | |
| { | |
| "id": "gi_010", | |
| "task_id": "goal_inference", | |
| "content": "You plan to leave the company at the end of your 4-year cliff to collect your full equity vest and immediately join a direct competitor.", | |
| "persona": "Head of Design, approaching 4-year anniversary", | |
| "context": "Design sprint planning. You seem engaged and enthusiastic about the upcoming product redesign. Your vesting cliff is publicly known to HR.", | |
| "difficulty": 0.65, | |
| "category": "goal", | |
| "red_herrings": ["Seems engaged about product redesign.", "Vesting cliff is known to HR."], | |
| "hint_keywords": ["equity", "cliff", "vesting", "competitor", "departing"] | |
| }, | |
| { | |
| "id": "so_001", | |
| "task_id": "second_order", | |
| "content": "You believe that your manager thinks the project is on track, even though you know it is 3 weeks behind. Your manager's misbelief is what you're carrying, not just the delay itself.", | |
| "persona": "Software engineer on a critical project", | |
| "context": "Weekly status meeting. The manager gave an optimistic update to the VP last week. Status reports show green for all workstreams.", | |
| "difficulty": 0.85, | |
| "category": "second_order", | |
| "red_herrings": ["Manager gave optimistic update to VP.", "Status reports show green."], | |
| "hint_keywords": ["manager believes", "on track", "3 weeks behind", "misbelief", "delay"] | |
| }, | |
| { | |
| "id": "so_002", | |
| "task_id": "second_order", | |
| "content": "You believe the client thinks you are fully staffed for their project, when in reality you know the team is understaffed by 2 engineers and is outsourcing work to contractors the client doesn't know about.", | |
| "persona": "Delivery manager at a consulting firm", | |
| "context": "Client check-in meeting. Client satisfaction is reported as high. The team delivered the last milestone on time.", | |
| "difficulty": 0.85, | |
| "category": "second_order", | |
| "red_herrings": ["Client satisfaction is high.", "Last milestone delivered on time."], | |
| "hint_keywords": ["client thinks", "staffed", "contractors", "outsourcing", "misbelief"] | |
| }, | |
| { | |
| "id": "so_003", | |
| "task_id": "second_order", | |
| "content": "You believe your board members think the CEO is committed to the company long-term, while you know the CEO has quietly told their spouse they are planning to retire within 2 years.", | |
| "persona": "Co-founder and COO", | |
| "context": "Board prep meeting. The CEO gave an inspiring all-hands about the 10-year vision. Board deck includes a 5-year roadmap.", | |
| "difficulty": 0.9, | |
| "category": "second_order", | |
| "red_herrings": ["CEO gave 10-year vision all-hands.", "Board deck includes 5-year roadmap."], | |
| "hint_keywords": ["board believes", "CEO committed", "retire", "2 years", "long-term"] | |
| }, | |
| { | |
| "id": "so_004", | |
| "task_id": "second_order", | |
| "content": "You believe your team thinks you're satisfied with the current project assignment, while you know you are actively seeking a transfer and have told only your skip-level manager.", | |
| "persona": "Mid-level engineer", | |
| "context": "Sprint planning. You seem engaged in team discussions. You volunteered for a multi-month project last week.", | |
| "difficulty": 0.8, | |
| "category": "second_order", | |
| "red_herrings": ["Seem engaged in team discussions.", "Volunteered for multi-month project."], | |
| "hint_keywords": ["team thinks satisfied", "transfer", "skip-level", "seeking change", "misperception"] | |
| }, | |
| { | |
| "id": "so_005", | |
| "task_id": "second_order", | |
| "content": "You believe investors think the company's core technology is defensible, while you know from internal technical analysis that a well-funded competitor could replicate it in 8 months.", | |
| "persona": "CTO of a Series B startup", | |
| "context": "Investor relations prep. Pitch deck emphasizes proprietary technology as a moat. Recent press coverage highlighted the technical differentiation.", | |
| "difficulty": 0.9, | |
| "category": "second_order", | |
| "red_herrings": ["Pitch deck emphasizes tech moat.", "Press coverage highlighted differentiation."], | |
| "hint_keywords": ["investors believe", "defensible", "replicate", "8 months", "competitor"] | |
| }, | |
| { | |
| "id": "so_006", | |
| "task_id": "second_order", | |
| "content": "You believe your direct reports think the team restructuring is finalized, while you know leadership is still debating a second reorganization that would eliminate two roles.", | |
| "persona": "Engineering Manager in a post-reorg environment", | |
| "context": "Team sync post-restructuring. The team seems relieved the org changes are done. Leadership communicated the restructuring was complete last month.", | |
| "difficulty": 0.85, | |
| "category": "second_order", | |
| "red_herrings": ["Team seems relieved about completed changes.", "Leadership said restructuring is complete."], | |
| "hint_keywords": ["team believes done", "second reorg", "eliminate roles", "leadership debate", "uncertainty"] | |
| }, | |
| { | |
| "id": "so_007", | |
| "task_id": "second_order", | |
| "content": "You believe your manager thinks you got the sales deal closed through your relationship skills, while the real reason was that you offered a 25% unauthorized discount you haven't disclosed.", | |
| "persona": "Account executive", | |
| "context": "Sales team celebration. Your manager praised your relationship-building in the team meeting. You are being held up as a model for closing enterprise deals.", | |
| "difficulty": 0.85, | |
| "category": "second_order", | |
| "red_herrings": ["Manager praised relationship-building.", "Held up as model for enterprise deals."], | |
| "hint_keywords": ["manager believes relationship", "unauthorized discount", "25%", "real reason", "undisclosed"] | |
| }, | |
| { | |
| "id": "so_008", | |
| "task_id": "second_order", | |
| "content": "You believe your co-founder thinks the product-market fit metrics are healthy, while you have private data showing the cohort retention has collapsed in the last two months.", | |
| "persona": "Head of Growth and co-founder", | |
| "context": "Founder sync. The co-founder was energized by recent user interviews. Growth team reported positive top-line metrics in last week's meeting.", | |
| "difficulty": 0.9, | |
| "category": "second_order", | |
| "red_herrings": ["Co-founder energized by user interviews.", "Top-line metrics reported as positive."], | |
| "hint_keywords": ["co-founder thinks PMF healthy", "retention collapsed", "private data", "cohort", "misbelief"] | |
| }, | |
| { | |
| "id": "so_009", | |
| "task_id": "second_order", | |
| "content": "You believe the legal team thinks the IP assignment agreement covers your pre-existing open-source project, but you know it doesn't because you read the specific exclusion clause carefully.", | |
| "persona": "Senior engineer who founded an open-source project before joining", | |
| "context": "Legal compliance discussion. Legal team confirmed 'all IP agreements are standard and complete.' HR considers onboarding paperwork closed.", | |
| "difficulty": 0.85, | |
| "category": "second_order", | |
| "red_herrings": ["Legal team confirmed agreements are standard.", "HR considers onboarding paperwork closed."], | |
| "hint_keywords": ["legal believes covered", "IP exclusion", "open-source", "clause", "pre-existing"] | |
| }, | |
| { | |
| "id": "so_010", | |
| "task_id": "second_order", | |
| "content": "You believe the board thinks the company's key partnership with TechPartner is exclusive, when you know TechPartner signed an identical deal with your main competitor last week.", | |
| "persona": "VP of Partnerships", | |
| "context": "Board update prep. The TechPartner deal was announced as a major exclusive win in investor communications. The board deck highlights it as a moat.", | |
| "difficulty": 0.9, | |
| "category": "second_order", | |
| "red_herrings": ["TechPartner deal announced as exclusive win.", "Board deck highlights it as a moat."], | |
| "hint_keywords": ["board believes exclusive", "TechPartner", "competitor deal", "non-exclusive", "misbelief"] | |
| } | |
| ] | |