Skip to content
Open
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
91 changes: 64 additions & 27 deletions vibe-check-runner.js
Original file line number Diff line number Diff line change
Expand Up @@ -2,14 +2,15 @@ import { Project, SyntaxKind } from 'ts-morph';
import fs from 'node:fs';
import fsPromises from 'node:fs/promises';
import path from 'node:path';
import { pathToFileURL } from 'node:url';
import { execFileSync } from 'node:child_process';
import { GoogleGenAI } from '@google/genai';

const ai = new GoogleGenAI({ apiKey: process.env.GOOGLE_AI_API_KEY });

// Constants for scoring

async function fileOrDirExists(filePath) {
export async function fileOrDirExists(filePath) {
try {
await fsPromises.stat(filePath);
return true;
Expand All @@ -25,7 +26,7 @@ const SCORES = {
EFFICIENCY: 10,
};

function getModifiedFiles() {
export function getModifiedFiles() {
try {
// In CI (daily run), check files modified in the last 24 hours.
// We filter for non-empty lines that end in .md and are in frontend/ or backend/
Expand All @@ -43,7 +44,7 @@ function getModifiedFiles() {
}
}

async function syncBenchmarks(tech, mdContent, retries = 5, delay = 10000) {
export async function syncBenchmarks(tech, mdContent, retries = 5, delay = 10000) {
try {
const prompt = `Based on the following documentation:\n\n${mdContent}\n\n1. Generate a "Golden Prompt" (a comprehensive instruction for generating a typical module using this technology) in JSON format: {"golden_prompt": "...", "tech": "${tech}"}\n2. Generate a JSON Schema for TS-Morph AST validation rules enforcing DDD/FSD layers and strict typing for this technology. The generated JSON schema must explicitly follow a nested structure compatible with \`analyzeAST\`. Format: {"$schema": "...", "type": "object", "properties": {"forbidden_types": {"contains": {"enum": ["any"]}}}}.\n\nRespond strictly with ONLY a JSON array containing these two objects in order. No markdown wrappers.`;
const response = await ai.models.generateContent({
Expand Down Expand Up @@ -85,7 +86,7 @@ async function syncBenchmarks(tech, mdContent, retries = 5, delay = 10000) {
}
}

async function simulateAIGeneration(goldenPrompt, tech, mdContent, retries = 5, delay = 10000) {
export async function simulateAIGeneration(goldenPrompt, tech, mdContent, retries = 5, delay = 10000) {
try {
const prompt = `${goldenPrompt}\n\nConstraints and instructions from the following documentation:\n\n${mdContent}\n\nGenerate ONLY raw code. No markdown formatting, no explanations.`;
const response = await ai.models.generateContent({
Expand All @@ -110,7 +111,7 @@ async function simulateAIGeneration(goldenPrompt, tech, mdContent, retries = 5,
}
}

function analyzeAST(sourceFile, tech) {
export function analyzeAST(sourceFile, tech) {
let score = {
arch: SCORES.ARCH,
type: SCORES.TYPE,
Expand Down Expand Up @@ -222,7 +223,7 @@ function analyzeAST(sourceFile, tech) {
return { total, breakdown: score };
}

async function runVibeCheck() {
export async function runVibeCheck() {
console.log('Running Vibe-Check Runner...');

const modifiedFiles = getModifiedFiles();
Expand All @@ -231,8 +232,6 @@ async function runVibeCheck() {
return;
}

const project = new Project();

// Configure git user for commits
try {
execFileSync('git', ['config', '--global', 'user.name', 'github-actions[bot]']);
Expand All @@ -241,10 +240,10 @@ async function runVibeCheck() {
console.warn('Failed to configure git user. If running locally, this is expected.');
}

// Deduplicate by tech and collect markdown contents
const filesByTech = {};
for (const file of modifiedFiles) {
console.log(`Processing ${file}...`);

if (!fs.existsSync(file)) {
if (!(await fileOrDirExists(file))) {
console.log(`File ${file} does not exist. Skipping.`);
continue;
}
Expand All @@ -265,28 +264,64 @@ async function runVibeCheck() {
}
}

const mdContent = await fsPromises.readFile(file, 'utf-8');
if (!filesByTech[tech]) filesByTech[tech] = [];
filesByTech[tech].push(file);
}

await syncBenchmarks(tech, mdContent);
// Sync benchmarks sequentially per tech
for (const [tech, files] of Object.entries(filesByTech)) {
const mdContents = await Promise.all(files.map(f => fsPromises.readFile(f, 'utf-8')));
const concatenatedContent = mdContents.join('\n\n--- \n\n');
await syncBenchmarks(tech, concatenatedContent);
}

const suitePath = path.join('benchmarks', 'suites', `${tech}.json`);
if (!fs.existsSync(suitePath)) {
console.log(`No benchmark suite found for ${tech}. Skipping.`);
continue;
}
// Concurrent Execution and Validation
const validationResults = await Promise.all(
modifiedFiles.map(async (file) => {
let tech = '';
if (file.includes('/angular/')) tech = 'angular';
else if (file.includes('/nestjs/')) tech = 'nestjs';
else if (file.includes('/typescript/')) tech = 'typescript';
else if (file.includes('/express/')) tech = 'express';
else if (file.includes('/nodejs/')) tech = 'nodejs';
else {
const parts = file.split('/');
tech = parts.length > 1 ? parts[1] : '';
}

const suiteConfig = JSON.parse(await fsPromises.readFile(suitePath, 'utf-8'));
if (!tech) return { file, score: -1, breakdown: null, error: 'No tech identified' };

const generatedCode = await simulateAIGeneration(suiteConfig.golden_prompt, tech, mdContent);
const suitePath = path.join('benchmarks', 'suites', `${tech}.json`);
if (!(await fileOrDirExists(suitePath))) {
return { file, score: -1, breakdown: null, error: `No benchmark suite found for ${tech}.` };
}

if (!generatedCode) {
console.error(`Failed to generate code for ${tech}.`);
const suiteConfig = JSON.parse(await fsPromises.readFile(suitePath, 'utf-8'));
const mdContent = await fsPromises.readFile(file, 'utf-8');

const generatedCode = await simulateAIGeneration(suiteConfig.golden_prompt, tech, mdContent);

if (!generatedCode) {
return { file, score: -1, breakdown: null, error: `Failed to generate code for ${tech}.` };
}

const project = new Project();
const uniqueFilename = `temp_${tech}_${Math.random().toString(36).substring(7)}.ts`;
const sourceFile = project.createSourceFile(uniqueFilename, generatedCode, { overwrite: true });
const { total: score, breakdown } = analyzeAST(sourceFile, tech);

return { file, tech, score, breakdown, generatedCode };
})
);

// Sequential Execution of stateful side-effects
for (const result of validationResults) {
if (result.error) {
console.log(result.error);
continue;
}

const sourceFile = project.createSourceFile(`temp_${tech}.ts`, generatedCode, { overwrite: true });
const { total: score, breakdown } = analyzeAST(sourceFile, tech);

const { file, tech, score, breakdown, generatedCode } = result;
console.log(`Fidelity Score for ${file}: ${score}%`);
console.log(`Breakdown:`, breakdown);

Expand All @@ -305,7 +340,7 @@ async function runVibeCheck() {
// Only commit if there are changes (badge might already be there)
const status = execFileSync('git', ['status', '--porcelain'], { encoding: 'utf-8' });
if (status.includes(file) || status.includes('benchmarks/')) {
execFileSync('git', ['commit', '-m', '[chore: benchmark-sync]']);
execFileSync('git', ['commit', '-m', '[chore: fidelity-pass]']);
execFileSync('git', ['push', 'origin', 'HEAD:main']);
} else {
console.log(`Badge already present in ${file}, skipping commit.`);
Expand Down Expand Up @@ -338,4 +373,6 @@ async function runVibeCheck() {
}
}

runVibeCheck().catch(console.error);
if (import.meta.url === pathToFileURL(process.argv[1]).href) {
runVibeCheck().catch(console.error);
}
Loading