|
const path = require('path');
const fs = require('fs');

// Repository root: three directory levels above this script's directory.
const rootPath = path.join(__dirname, "..", "..", "..");
// Each sub-directory of `evalprompt` may contain an `output.json` and a `baseline.json`.
const evalPromptDir = path.join(rootPath, "evalprompt");

/**
 * Returns the value of the first key in `keys` that is present (non-nullish) on `obj`.
 *
 * Used to read baseline counters under either their singular or plural name,
 * because the original script referenced both spellings.
 * NOTE(review): confirm which spelling baseline.json really uses and drop the other.
 *
 * @param {object} obj - Object to read from.
 * @param {...string} keys - Candidate property names, in priority order.
 * @returns {*} The first non-nullish value, or `undefined` when none is set.
 */
function firstDefined(obj, ...keys) {
  for (const key of keys) {
    if (obj[key] != null) {
      return obj[key];
    }
  }
  return undefined;
}

/**
 * Builds the markdown section for one eval directory.
 *
 * @param {string} dir - Name of the eval directory (used in the heading line).
 * @param {object} output - Parsed `output.json`; reads `results.stats.successes`,
 *   `results.stats.failures`, `results.prompts[0].metrics.score` and `shareableUrl`.
 * @param {?object} baseline - Parsed `baseline.json`, or `null` when there is none.
 * @returns {string} Markdown text: heading, results table, and a results link/hint.
 */
function buildSection(dir, output, baseline) {
  const { successes, failures } = output.results.stats;
  const score = output.results.prompts[0].metrics.score;

  let body = ` LLM prompt result for ${dir}

| From | Success | Failure | Score |
|---------|---------|---------|---------|
| Output | ${successes} | ${failures} | ${score} |
`;

  if (baseline) {
    const baseSuccesses = firstDefined(baseline, 'successes', 'success');
    const baseFailures = firstDefined(baseline, 'failures', 'failure');
    const baseScore = baseline.score;

    body += `|Baseline| ${baseSuccesses} | ${baseFailures} | ${baseScore} |\n`;

    // A run regresses when it is worse than the baseline on any metric:
    // fewer successes, more failures, or a lower score. A metric missing from
    // the baseline compares as `false` and therefore never fails the run.
    const hasRegressed =
      successes < baseSuccesses ||
      failures > baseFailures ||
      score < baseScore;

    body = (hasRegressed ? `[Not PASS]🚨 ` : `[PASS]✅ `) + body;
  }

  if (output.shareableUrl) {
    body += `\n**» [View eval results](${output.shareableUrl}) «**\n`;
  } else {
    body += '\n**» View eval results in CI console «**\n';
  }

  return body;
}

// collect results
let commentContent = '';
const directories = fs.readdirSync(evalPromptDir, { withFileTypes: true })
  .filter(dirent => dirent.isDirectory())
  .map(dirent => dirent.name);
console.log(directories);

for (const dir of directories) {
  const outputFile = path.join(evalPromptDir, dir, 'output.json');
  // Directories without an output file contribute nothing to the comment.
  if (!fs.existsSync(outputFile)) {
    continue;
  }
  console.log(outputFile);
  const output = JSON.parse(fs.readFileSync(outputFile, 'utf8'));

  // The baseline is optional; without it the section carries no PASS/Not PASS prefix.
  const baselineFile = path.join(evalPromptDir, dir, 'baseline.json');
  const baseline = fs.existsSync(baselineFile)
    ? JSON.parse(fs.readFileSync(baselineFile, 'utf8'))
    : null;

  commentContent += buildSection(dir, output, baseline) + "\n\n";
}

// Write the aggregated comment text to the repository root.
fs.writeFileSync(path.join(rootPath, 'commentContent.txt'), commentContent, 'utf-8');
0 commit comments