|
45 | 45 | {"filepath":"/Users/alacolombiadev/Documents/code/teamxray/evals/real-analysis.eval.ts","name":"AI Expertise Analysis - Quality Check","score":null,"duration":0,"results":[],"startTime":"2025-11-24T20:29:44.991Z","sourceCodeHash":""} |
46 | 46 | {"filepath":"/Users/alacolombiadev/Documents/code/teamxray/evals/real-analysis.eval.ts","name":"File Expert Matching","score":1,"duration":49,"results":[{"input":{"filePath":"src/auth/login.ts","contributors":[{"name":"Alice Chen","commits":15,"lastEdit":"2025-11-20"},{"name":"Bob Martinez","commits":2,"lastEdit":"2025-10-15"}]},"result":{"filePath":"src/auth/login.ts","expertName":"Alice Chen","confidence":0.8823529411764706,"totalContributions":15},"expected":{"expert":"Alice Chen","confidenceThreshold":0.7},"scores":[{"name":"Expert Match Accuracy","score":1,"details":"Alice Chen (88% confidence)"},{"name":"Confidence Level","score":1,"details":"Confidence: 88%"}],"duration":2,"score":1,"traces":[]}],"startTime":"2025-11-24T20:29:44.991Z","sourceCodeHash":"b2f3533fbbd6a79dd6d724e4e1957bcff5bef7889ea25b44cba1fea1d4647e72"} |
47 | 47 | {"filepath":"/Users/alacolombiadev/Documents/code/teamxray/evals/real-analysis.eval.ts","name":"Collaboration Pattern Analysis","score":0.5833333333333333,"duration":49,"results":[{"input":{"commits":["Fixed bug in payment processing - thanks Alice for catching this!","Reviewed Bob's authentication PR - solid work","Pair programmed with Charlie on the new API endpoints","Merged feature after team discussion"]},"result":{"collaborationScore":1,"patterns":["gratitude/recognition","code review","pair programming","team collaboration","integration work"],"totalCommits":4,"collaborativeCommits":4},"expected":{"collaborationScore":0.75,"patterns":["code review","pair programming","team discussion"]},"scores":[{"name":"Collaboration Score Accuracy","score":0.5,"details":"Score: 100% (expected: 75%)"},{"name":"Pattern Detection","score":0.6666666666666666,"details":"Found 2/3 expected patterns"}],"duration":2,"score":0.5833333333333333,"traces":[]}],"startTime":"2025-11-24T20:29:44.991Z","sourceCodeHash":"b2f3533fbbd6a79dd6d724e4e1957bcff5bef7889ea25b44cba1fea1d4647e72"} |
| 48 | +{"startTime":"2025-11-24T22:19:51.715Z","type":"FULL_RUN_BEGIN"} |
| 49 | +{"filepath":"/Users/alacolombiadev/Documents/code/teamxray/evals/real-analysis.eval.ts","name":"AI Expertise Analysis - Quality Check","score":1,"duration":1,"results":[{"input":{"repositoryData":{"contributors":[{"name":"Alice Chen","email":" [email protected]","commits":245,"additions":15230,"deletions":8420},{"name":"Bob Martinez","email":" [email protected]","commits":156,"additions":9840,"deletions":4210}],"commits":[{"author":"Alice Chen","message":"Refactor authentication system with improved security","date":"2025-11-20","files":["src/auth/login.ts","src/auth/security.ts"]},{"author":"Alice Chen","message":"Code review: Helped Bob with async/await patterns","date":"2025-11-19","files":[]},{"author":"Bob Martinez","message":"Add React dashboard components with TypeScript","date":"2025-11-18","files":["src/ui/Dashboard.tsx","src/ui/Charts.tsx"]}],"fileChanges":{"src/auth/login.ts":["Alice Chen"],"src/auth/security.ts":["Alice Chen"],"src/ui/Dashboard.tsx":["Bob Martinez"],"src/ui/Charts.tsx":["Bob Martinez"]}}},"result":{"topExpert":"Alice Chen","totalContributors":2,"hasMentoringBehavior":true,"specializations":["Authentication","Security","React","TypeScript"],"humanInsights":["Alice Chen shows mentoring behavior through code reviews and helping teammates","Alice Chen demonstrates deep expertise with 245 meaningful contributions"],"communicationStyle":"Collaborative and supportive"},"expected":{"topExpertName":"Alice Chen","detectsMentoring":true,"identifiesSpecializations":true,"humanInsights":true},"scores":[{"name":"Top Expert Identification","score":1,"details":"Identified: Alice Chen (expected: Alice Chen)"},{"name":"Mentoring Pattern Detection","score":1,"details":"Detected mentoring: ✓"},{"name":"Specialization Detection","score":1,"details":"Found specializations: Authentication, Security, React, TypeScript"},{"name":"Human Insights Quality","score":1,"details":"Generated 2 insights"}],"duration":1,"score":1,"traces":[]}],"startTime":"2025-11-24T22:19:51.786Z","sourceCodeHash":"b2f3533fbbd6a79dd6d724e4e1957bcff5bef7889ea25b44cba1fea1d4647e72"} |
| 50 | +{"filepath":"/Users/alacolombiadev/Documents/code/teamxray/evals/real-analysis.eval.ts","name":"File Expert Matching","score":1,"duration":0,"results":[{"input":{"filePath":"src/auth/login.ts","contributors":[{"name":"Alice Chen","commits":15,"lastEdit":"2025-11-20"},{"name":"Bob Martinez","commits":2,"lastEdit":"2025-10-15"}]},"result":{"filePath":"src/auth/login.ts","expertName":"Alice Chen","confidence":0.8823529411764706,"totalContributions":15},"expected":{"expert":"Alice Chen","confidenceThreshold":0.7},"scores":[{"name":"Expert Match Accuracy","score":1,"details":"Alice Chen (88% confidence)"},{"name":"Confidence Level","score":1,"details":"Confidence: 88%"}],"duration":0,"score":1,"traces":[]}],"startTime":"2025-11-24T22:19:51.786Z","sourceCodeHash":"b2f3533fbbd6a79dd6d724e4e1957bcff5bef7889ea25b44cba1fea1d4647e72"} |
| 51 | +{"filepath":"/Users/alacolombiadev/Documents/code/teamxray/evals/real-analysis.eval.ts","name":"Collaboration Pattern Analysis","score":0.5833333333333333,"duration":0,"results":[{"input":{"commits":["Fixed bug in payment processing - thanks Alice for catching this!","Reviewed Bob's authentication PR - solid work","Pair programmed with Charlie on the new API endpoints","Merged feature after team discussion"]},"result":{"collaborationScore":1,"patterns":["gratitude/recognition","code review","pair programming","team collaboration","integration work"],"totalCommits":4,"collaborativeCommits":4},"expected":{"collaborationScore":0.75,"patterns":["code review","pair programming","team discussion"]},"scores":[{"name":"Collaboration Score Accuracy","score":0.5,"details":"Score: 100% (expected: 75%)"},{"name":"Pattern Detection","score":0.6666666666666666,"details":"Found 2/3 expected patterns"}],"duration":0,"score":0.5833333333333333,"traces":[]}],"startTime":"2025-11-24T22:19:51.786Z","sourceCodeHash":"b2f3533fbbd6a79dd6d724e4e1957bcff5bef7889ea25b44cba1fea1d4647e72"} |
| 52 | +{"filepath":"/Users/alacolombiadev/Documents/code/teamxray/evals/starter.eval.ts","name":"Expert Identification - Basic","score":1,"duration":0,"results":[{"input":{"contributors":[{"name":"Alice Dev","commits":150},{"name":"Bob Engineer","commits":85},{"name":"Charlie Coder","commits":45}]},"result":{"topExpert":"Alice Dev","totalExperts":3,"expertiseScores":[{"name":"Alice Dev","score":100},{"name":"Bob Engineer","score":56.666666666666664},{"name":"Charlie Coder","score":30}]},"expected":{"topExpert":"Alice Dev","totalExperts":3},"scores":[{"name":"Top Expert Accuracy","score":1,"details":"✓ Correctly identified Alice Dev"},{"name":"Expert Count","score":1,"details":"Found 3 experts (expected: 3)"}],"duration":0,"score":1,"traces":[]},{"input":{"contributors":[{"name":"Sarah Smith","commits":200}]},"result":{"topExpert":"Sarah Smith","totalExperts":1,"expertiseScores":[{"name":"Sarah Smith","score":100}]},"expected":{"topExpert":"Sarah Smith","totalExperts":1},"scores":[{"name":"Top Expert Accuracy","score":1,"details":"✓ Correctly identified Sarah Smith"},{"name":"Expert Count","score":1,"details":"Found 1 experts (expected: 1)"}],"duration":0,"score":1,"traces":[]}],"startTime":"2025-11-24T22:19:51.786Z","sourceCodeHash":"b2f3533fbbd6a79dd6d724e4e1957bcff5bef7889ea25b44cba1fea1d4647e72"} |
| 53 | +{"filepath":"/Users/alacolombiadev/Documents/code/teamxray/evals/starter.eval.ts","name":"Team Collaboration Detection","score":1,"duration":0,"results":[{"input":{"commits":["Fixed bug in payment processor","Reviewed Alice's PR - looks good!","Merged feature branch after testing"]},"result":{"hasCollaboration":true,"patterns":["review","merge"]},"expected":{"hasCollaboration":true},"scores":[{"name":"Collaboration Detection","score":1,"details":"Detected patterns: review, merge"}],"duration":0,"score":1,"traces":[]}],"startTime":"2025-11-24T22:19:51.786Z","sourceCodeHash":"b2f3533fbbd6a79dd6d724e4e1957bcff5bef7889ea25b44cba1fea1d4647e72"} |
0 commit comments