<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom" xmlns:dc="http://purl.org/dc/elements/1.1/">
  <channel>
    <title>Forem: Dipesh Ray</title>
    <description>The latest articles on Forem by Dipesh Ray (@dipeshrayg).</description>
    <link>https://forem.com/dipeshrayg</link>
    <image>
      <url>https://media2.dev.to/dynamic/image/width=90,height=90,fit=cover,gravity=auto,format=auto/https:%2F%2Fdev-to-uploads.s3.amazonaws.com%2Fuploads%2Fuser%2Fprofile_image%2F3939021%2Fcfde8f94-8882-4bc7-9746-c3fb68cf4867.jpeg</url>
      <title>Forem: Dipesh Ray</title>
      <link>https://forem.com/dipeshrayg</link>
    </image>
    <atom:link rel="self" type="application/rss+xml" href="https://forem.com/feed/dipeshrayg"/>
    <language>en</language>
    <item>
      <title>This is an Autonomous Brain.</title>
      <dc:creator>Dipesh Ray</dc:creator>
      <pubDate>Tue, 19 May 2026 10:34:46 +0000</pubDate>
      <link>https://forem.com/dipeshrayg/this-is-an-autonomous-brain-1jif</link>
      <guid>https://forem.com/dipeshrayg/this-is-an-autonomous-brain-1jif</guid>
      <description>&lt;div class="ltag__link--embedded"&gt;
  &lt;div class="crayons-story "&gt;
  &lt;a href="https://dev.to/dipeshrayg/multi-agent-ai-developer-4g7o" class="crayons-story__hidden-navigation-link"&gt;Multi-Agent AI developer&lt;/a&gt;


  &lt;div class="crayons-story__body crayons-story__body-full_post"&gt;
    &lt;div class="crayons-story__top"&gt;
      &lt;div class="crayons-story__meta"&gt;
        &lt;div class="crayons-story__author-pic"&gt;

          &lt;a href="/dipeshrayg" class="crayons-avatar  crayons-avatar--l  "&gt;
            &lt;img src="https://media2.dev.to/dynamic/image/width=800%2Cheight=%2Cfit=scale-down%2Cgravity=auto%2Cformat=auto/https%3A%2F%2Fdev-to-uploads.s3.amazonaws.com%2Fuploads%2Fuser%2Fprofile_image%2F3939021%2Fcfde8f94-8882-4bc7-9746-c3fb68cf4867.jpeg" alt="dipeshrayg profile" class="crayons-avatar__image" width="460" height="460"&gt;
          &lt;/a&gt;
        &lt;/div&gt;
        &lt;div&gt;
          &lt;div&gt;
            &lt;a href="/dipeshrayg" class="crayons-story__secondary fw-medium m:hidden"&gt;
              Dipesh Ray
            &lt;/a&gt;
            &lt;div class="profile-preview-card relative mb-4 s:mb-0 fw-medium hidden m:inline-block"&gt;
              
                Dipesh Ray
                
              
              &lt;div id="story-author-preview-content-3695963" class="profile-preview-card__content crayons-dropdown branded-7 p-4 pt-0"&gt;
                &lt;div class="gap-4 grid"&gt;
                  &lt;div class="-mt-4"&gt;
                    &lt;a href="/dipeshrayg" class="flex"&gt;
                      &lt;span class="crayons-avatar crayons-avatar--xl mr-2 shrink-0"&gt;
                        &lt;img src="https://media2.dev.to/dynamic/image/width=800%2Cheight=%2Cfit=scale-down%2Cgravity=auto%2Cformat=auto/https%3A%2F%2Fdev-to-uploads.s3.amazonaws.com%2Fuploads%2Fuser%2Fprofile_image%2F3939021%2Fcfde8f94-8882-4bc7-9746-c3fb68cf4867.jpeg" class="crayons-avatar__image" alt="" width="460" height="460"&gt;
                      &lt;/span&gt;
                      &lt;span class="crayons-link crayons-subtitle-2 mt-5"&gt;Dipesh Ray&lt;/span&gt;
                    &lt;/a&gt;
                  &lt;/div&gt;
                  &lt;div class="print-hidden"&gt;
                    
                      Follow
                    
                  &lt;/div&gt;
                  &lt;div class="author-preview-metadata-container"&gt;&lt;/div&gt;
                &lt;/div&gt;
              &lt;/div&gt;
            &lt;/div&gt;

          &lt;/div&gt;
          &lt;a href="https://dev.to/dipeshrayg/multi-agent-ai-developer-4g7o" class="crayons-story__tertiary fs-xs"&gt;&lt;time&gt;May 18&lt;/time&gt;&lt;span class="time-ago-indicator-initial-placeholder"&gt;&lt;/span&gt;&lt;/a&gt;
        &lt;/div&gt;
      &lt;/div&gt;

    &lt;/div&gt;

    &lt;div class="crayons-story__indention"&gt;
      &lt;h2 class="crayons-story__title crayons-story__title-full_post"&gt;
        &lt;a href="https://dev.to/dipeshrayg/multi-agent-ai-developer-4g7o" id="article-link-3695963"&gt;
          Multi-Agent AI developer
        &lt;/a&gt;
      &lt;/h2&gt;
        &lt;div class="crayons-story__tags"&gt;
            &lt;a class="crayons-tag  crayons-tag--monochrome " href="/t/ai"&gt;&lt;span class="crayons-tag__prefix"&gt;#&lt;/span&gt;ai&lt;/a&gt;
            &lt;a class="crayons-tag  crayons-tag--monochrome " href="/t/webdev"&gt;&lt;span class="crayons-tag__prefix"&gt;#&lt;/span&gt;webdev&lt;/a&gt;
            &lt;a class="crayons-tag  crayons-tag--monochrome " href="/t/productivity"&gt;&lt;span class="crayons-tag__prefix"&gt;#&lt;/span&gt;productivity&lt;/a&gt;
            &lt;a class="crayons-tag  crayons-tag--monochrome " href="/t/programming"&gt;&lt;span class="crayons-tag__prefix"&gt;#&lt;/span&gt;programming&lt;/a&gt;
        &lt;/div&gt;
      &lt;div class="crayons-story__bottom"&gt;
        &lt;div class="crayons-story__details"&gt;
          &lt;a href="https://dev.to/dipeshrayg/multi-agent-ai-developer-4g7o" class="crayons-btn crayons-btn--s crayons-btn--ghost crayons-btn--icon-left"&gt;
            &lt;div class="multiple_reactions_aggregate"&gt;
              &lt;span class="multiple_reactions_icons_container"&gt;
                  &lt;span class="crayons_icon_container"&gt;
                    &lt;img src="https://assets.dev.to/assets/sparkle-heart-5f9bee3767e18deb1bb725290cb151c25234768a0e9a2bd39370c382d02920cf.svg" width="24" height="24"&gt;
                  &lt;/span&gt;
              &lt;/span&gt;
              &lt;span class="aggregate_reactions_counter"&gt;1&lt;span class="hidden s:inline"&gt; reaction&lt;/span&gt;&lt;/span&gt;
            &lt;/div&gt;
          &lt;/a&gt;
            &lt;a href="https://dev.to/dipeshrayg/multi-agent-ai-developer-4g7o#comments" class="crayons-btn crayons-btn--s crayons-btn--ghost crayons-btn--icon-left flex items-center"&gt;
              Comments


              &lt;span class="hidden s:inline"&gt;Add Comment&lt;/span&gt;
            &lt;/a&gt;
        &lt;/div&gt;
        &lt;div class="crayons-story__save"&gt;
          &lt;small class="crayons-story__tertiary fs-xs mr-2"&gt;
            5 min read
          &lt;/small&gt;
            
              &lt;span class="bm-initial"&gt;
                

              &lt;/span&gt;
              &lt;span class="bm-success"&gt;
                

              &lt;/span&gt;
            
        &lt;/div&gt;
      &lt;/div&gt;
    &lt;/div&gt;
  &lt;/div&gt;
&lt;/div&gt;

&lt;/div&gt;


</description>
    </item>
    <item>
      <title>Multi-Agent AI developer</title>
      <dc:creator>Dipesh Ray</dc:creator>
      <pubDate>Mon, 18 May 2026 22:36:31 +0000</pubDate>
      <link>https://forem.com/dipeshrayg/multi-agent-ai-developer-4g7o</link>
      <guid>https://forem.com/dipeshrayg/multi-agent-ai-developer-4g7o</guid>
      <description>&lt;h1&gt;
  
  
  I Built a Multi-Agent AI Boardroom That Ships Software on Its Own — For Free
&lt;/h1&gt;

&lt;p&gt;&lt;em&gt;How I designed an autonomous LLM pipeline with a CEO, security officer, and QA team that produces real, browser-runnable projects up to 5 times a day — running entirely on GitHub Models.&lt;/em&gt;&lt;/p&gt;




&lt;h2&gt;
  
  
  The Idea
&lt;/h2&gt;

&lt;p&gt;What if an AI system could not just write code, but manage the entire software engineering process itself?&lt;/p&gt;

&lt;p&gt;Not a single model generating code. A &lt;strong&gt;hierarchy of specialised agents&lt;/strong&gt; — each with a defined role, authority, and scope — collaborating like a real engineering organisation.&lt;/p&gt;

&lt;p&gt;That's what &lt;code&gt;autonomous-brain&lt;/code&gt; is.&lt;/p&gt;

&lt;p&gt;It's a self-improving AI software-engineering pipeline. A boardroom of LLMs that autonomously designs, builds, security-reviews, and publishes brand-new browser-runnable projects — several times a day. Each one more complex than the last.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Live dashboard:&lt;/strong&gt; &lt;a href="https://dipeshrayg.github.io/autonomous-brain/" rel="noopener noreferrer"&gt;dipeshrayg.github.io/autonomous-brain&lt;/a&gt;&lt;br&gt;&lt;br&gt;
&lt;strong&gt;Cost to run:&lt;/strong&gt; $0 — powered entirely by GitHub Models.&lt;/p&gt;




&lt;h2&gt;
  
  
  The Architecture: An AI Boardroom
&lt;/h2&gt;

&lt;p&gt;The key design decision was &lt;strong&gt;role separation&lt;/strong&gt;. Most AI coding tools use one model doing everything. That produces mediocre generalist output. I wanted specialist agents that could critique each other.&lt;/p&gt;

&lt;p&gt;Here's how the hierarchy works:&lt;/p&gt;

&lt;h3&gt;
  
  
  Strategic Layer (Long-Horizon Decisions)
&lt;/h3&gt;

&lt;p&gt;&lt;strong&gt;CEO&lt;/strong&gt; — &lt;code&gt;gpt-4o&lt;/code&gt;, fires every 6 hours&lt;br&gt;&lt;br&gt;
Reviews the trajectory of recent projects. Issues strict directives: "stop building visualisers, explore simulation systems." The pipeline must obey.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;CSO (Chief Security Officer)&lt;/strong&gt; — &lt;code&gt;gpt-4o&lt;/code&gt;, fires every 12 hours&lt;br&gt;&lt;br&gt;
Audits security posture across recent output. Issues directives like "all projects must sanitise user input" or "avoid eval()." These flow into every subsequent build.&lt;/p&gt;

&lt;h3&gt;
  
  
  Execution Layer (Per-Project)
&lt;/h3&gt;

&lt;p&gt;&lt;strong&gt;VP Engineering&lt;/strong&gt; — fires every 15 minutes&lt;br&gt;&lt;br&gt;
Decides whether a new project should be dispatched. Acts as a watchdog, enforcing cadence and complexity targets.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Architect Candidates&lt;/strong&gt; — &lt;code&gt;gpt-4o-mini&lt;/code&gt; + &lt;code&gt;Phi-3.5-MoE&lt;/code&gt; in parallel&lt;br&gt;&lt;br&gt;
Two models independently propose project designs. Competition produces better ideas than a single proposal.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Chief Architect / Judge&lt;/strong&gt; — &lt;code&gt;gpt-4o&lt;/code&gt;&lt;br&gt;&lt;br&gt;
Reads both proposals, synthesises the strongest elements, and produces the final design spec. No rubber-stamping — it genuinely chooses.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Engineers&lt;/strong&gt; — &lt;code&gt;gpt-4o&lt;/code&gt;, one LLM call per file&lt;br&gt;&lt;br&gt;
Implement the spec. Each file is a separate call, keeping context focused and output quality high.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Code Reviewers&lt;/strong&gt; — &lt;code&gt;gpt-4o-mini&lt;/code&gt; + &lt;code&gt;Phi-3.5-MoE&lt;/code&gt; in parallel&lt;br&gt;&lt;br&gt;
Two independent reviewers critique the output simultaneously. Results are merged.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Security Officer&lt;/strong&gt; — &lt;code&gt;gpt-4o&lt;/code&gt;&lt;br&gt;&lt;br&gt;
A hard gate. If the project has critical or high severity findings, it does not publish. No exceptions.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Fixer / Polisher&lt;/strong&gt; — &lt;code&gt;gpt-4o-mini&lt;/code&gt;&lt;br&gt;&lt;br&gt;
Applies reviewer feedback and runs a final polish pass before QA.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;QA&lt;/strong&gt; — Playwright + Chromium&lt;br&gt;&lt;br&gt;
Mechanical headless-browser verification. The project must load and pass basic interaction checks or it gets flagged.&lt;/p&gt;




&lt;h2&gt;
  
  
  Why Multi-Agent Instead of One Big Prompt?
&lt;/h2&gt;

&lt;p&gt;Single-model approaches have a ceiling. When you ask one model to design, implement, review, and secure a project in one pass, context pollution degrades quality at every stage.&lt;/p&gt;

&lt;p&gt;Multi-agent separation solves this:&lt;/p&gt;

&lt;ol&gt;
&lt;li&gt;
&lt;strong&gt;Fresh context per role&lt;/strong&gt; — the Security Officer reads the finished code, not the design discussion. It sees what a real attacker would see.&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Adversarial review&lt;/strong&gt; — two Architect Candidates competing produces better designs than one model agreeing with itself.&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Hierarchy enforces consistency&lt;/strong&gt; — CEO directives propagate down. The system doesn't just build random things. It has a direction.&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Specialised models where appropriate&lt;/strong&gt; — &lt;code&gt;gpt-4o-mini&lt;/code&gt; is fast and cheap for parallel review passes. &lt;code&gt;gpt-4o&lt;/code&gt; is reserved for judgement calls.&lt;/li&gt;
&lt;/ol&gt;




&lt;h2&gt;
  
  
  Self-Improvement: How the Complexity Grows
&lt;/h2&gt;

&lt;p&gt;Each project is assigned a complexity score. The system tracks this over time.&lt;/p&gt;

&lt;p&gt;The CEO reviews recent complexity trends. If projects are getting simpler or stagnating, it issues a directive forcing the next Architect to push harder.&lt;/p&gt;

&lt;p&gt;Currently:&lt;/p&gt;

&lt;ul&gt;
&lt;li&gt;&lt;strong&gt;28 projects shipped&lt;/strong&gt;&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Peak complexity:&lt;/strong&gt; 43 (open-ended scale)&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Average complexity:&lt;/strong&gt; 21.5&lt;/li&gt;
&lt;/ul&gt;

&lt;p&gt;The system genuinely trends upward. Early projects were simple visualisers. Recent ones include multi-agent simulations, healthcare dashboards, and adaptive AI strategy games.&lt;/p&gt;




&lt;h2&gt;
  
  
  Running for Free: GitHub Models
&lt;/h2&gt;

&lt;p&gt;Every model in this pipeline runs on &lt;strong&gt;GitHub Models&lt;/strong&gt; — a free tier that gives access to &lt;code&gt;gpt-4o&lt;/code&gt;, &lt;code&gt;gpt-4o-mini&lt;/code&gt;, and open models like &lt;code&gt;Phi-3.5-MoE&lt;/code&gt; via a standard OpenAI-compatible API.&lt;/p&gt;

&lt;p&gt;No credit card. No rate limit issues at this scale. The only cost is the GitHub Actions runner time, which is also free within limits.&lt;/p&gt;

&lt;p&gt;This means the entire system — from CEO strategic review to Playwright QA — costs $0 to run.&lt;/p&gt;




&lt;h2&gt;
  
  
  What It Has Built So Far
&lt;/h2&gt;

&lt;p&gt;In 28 runs, the system has shipped projects across:&lt;/p&gt;

&lt;ul&gt;
&lt;li&gt;
&lt;strong&gt;Mathematics&lt;/strong&gt; — differential equation visualisers, fractal explorers&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Healthcare&lt;/strong&gt; — simulation dashboards, resource allocation tools&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Environmental Science&lt;/strong&gt; — climate data explorers&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Arts&lt;/strong&gt; — generative art engines, emergent pattern systems&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Cybersecurity&lt;/strong&gt; — visual cryptography tools, cipher simulators&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Bioinformatics&lt;/strong&gt; — sequence analysis tools&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Game Design&lt;/strong&gt; — adaptive AI strategy games&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;History&lt;/strong&gt; — interactive timelines&lt;/li&gt;
&lt;/ul&gt;

&lt;p&gt;Every single one is a browser-runnable project with a one-click demo. No setup. No dependencies. Open the link, it runs.&lt;/p&gt;




&lt;h2&gt;
  
  
  What I Learned
&lt;/h2&gt;

&lt;p&gt;&lt;strong&gt;1. Role design is the hardest part.&lt;/strong&gt;&lt;br&gt;&lt;br&gt;
Deciding what each agent knows, when it fires, and what authority it has took more iteration than any code. Get the roles wrong and agents either duplicate work or conflict.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;2. Hard gates matter.&lt;/strong&gt;&lt;br&gt;&lt;br&gt;
The Security Officer's hard veto was the best decision I made. Without it, the system published insecure projects that looked fine on the surface. The gate changed the architecture of subsequent projects — engineers started writing more defensively because they knew the gate existed.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;3. Parallelism is underused in AI pipelines.&lt;/strong&gt;&lt;br&gt;&lt;br&gt;
Running two Architect Candidates and two Code Reviewers in parallel added almost no latency (async calls) but meaningfully improved output quality. The Judge step pays for itself.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;4. Complexity targets need a mechanism, not just a prompt.&lt;/strong&gt;&lt;br&gt;&lt;br&gt;
Telling a model "make it more complex" doesn't work. Giving the CEO a tracked metric and authority to issue directives based on it does.&lt;/p&gt;




&lt;h2&gt;
  
  
  What's Next
&lt;/h2&gt;

&lt;ul&gt;
&lt;li&gt;
&lt;strong&gt;Memory across projects&lt;/strong&gt; — the CEO currently reviews recent output but doesn't have a long-term memory of what patterns have been overused globally&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Engineer specialisation&lt;/strong&gt; — specialist engineer agents for frontend, backend, and security rather than generalist engineers per file&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Contributor mode&lt;/strong&gt; — allowing external prompts to influence CEO directives&lt;/li&gt;
&lt;li&gt;
&lt;strong&gt;Open source the engine&lt;/strong&gt; — &lt;code&gt;autonomous-brain-engine&lt;/code&gt; (the Python orchestrator) will be open-sourced once I've cleaned up the API key handling&lt;/li&gt;
&lt;/ul&gt;




&lt;h2&gt;
  
  
  Try It
&lt;/h2&gt;

&lt;p&gt;&lt;strong&gt;Dashboard (all 28 projects, live demos):&lt;/strong&gt; &lt;a href="https://dipeshrayg.github.io/autonomous-brain/" rel="noopener noreferrer"&gt;dipeshrayg.github.io/autonomous-brain&lt;/a&gt;&lt;br&gt;&lt;br&gt;
&lt;strong&gt;GitHub:&lt;/strong&gt; &lt;a href="https://github.com/dipeshrayg/autonomous-brain" rel="noopener noreferrer"&gt;github.com/dipeshrayg/autonomous-brain&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;If you build something inspired by this or have questions about the architecture, I'm &lt;a href="https://dev.to/dipeshrayg"&gt;@dipeshrayg on Dev.to&lt;/a&gt; — happy to discuss.&lt;/p&gt;




&lt;p&gt;&lt;em&gt;I'm a Computing Systems student in London working on autonomous AI systems and applied cryptography. This is part of my ongoing work on multi-agent architectures.&lt;/em&gt;&lt;/p&gt;




&lt;p&gt;&lt;strong&gt;Tags:&lt;/strong&gt; &lt;code&gt;ai&lt;/code&gt; &lt;code&gt;machinelearning&lt;/code&gt; &lt;code&gt;opensource&lt;/code&gt; &lt;code&gt;python&lt;/code&gt; &lt;code&gt;beginners&lt;/code&gt;&lt;/p&gt;

&lt;p&gt;&lt;a href="https://media2.dev.to/dynamic/image/width=800%2Cheight=%2Cfit=scale-down%2Cgravity=auto%2Cformat=auto/https%3A%2F%2Fdev-to-uploads.s3.amazonaws.com%2Fuploads%2Farticles%2Fz24jhyln4y5lc8jl2h0l.png" class="article-body-image-wrapper"&gt;&lt;img src="https://media2.dev.to/dynamic/image/width=800%2Cheight=%2Cfit=scale-down%2Cgravity=auto%2Cformat=auto/https%3A%2F%2Fdev-to-uploads.s3.amazonaws.com%2Fuploads%2Farticles%2Fz24jhyln4y5lc8jl2h0l.png" alt=" " width="800" height="390"&gt;&lt;/a&gt;&lt;/p&gt;

</description>
      <category>ai</category>
      <category>webdev</category>
      <category>productivity</category>
      <category>programming</category>
    </item>
  </channel>
</rss>
