sg-proxy/main.js

require("dotenv").config();

const express = require('express');
const axios = require('axios');
const app = express();
const StringDecoder = require('string_decoder').StringDecoder;

const bodyParser = require('body-parser');
app.use(bodyParser.json({ limit: '100mb' }));
app.use(bodyParser.urlencoded({limit: '100mb', extended: true}));

const API_TOKEN = process.env.API_TOKEN;

function handleError(res, isStream) {
  // If the request hasn't finished, notify the user that there was an error and finish
  // the request properly, so that ST isn't left hanging.
  const errMsg = "\n**Received an error during the request, please check sg-proxy logs!**";
  let jsonResp = {completion: errMsg, stop_reason: "stop_sequence"};
  if (!res.writableEnded) {
    if (isStream) {
      res.write(`event: completion\r\ndata: ${JSON.stringify(jsonResp)}\r\n\r\n`);
    } else {
      // This is unlikely to trigger, but can happen if the error was caught
      // before the request was sent (without streaming)
      res.json(jsonResp);
    }
    res.end();
  }
}

app.post('/v1/complete', async (req, res) => {
  res.setHeader('Content-Type', 'text/event-stream; charset=utf-8');
  res.setHeader('Cache-Control', 'no-cache');
  res.setHeader('Connection', 'keep-alive');
  res.setHeader('Transfer-Encoding', 'chunked');
  res.flushHeaders();
  
  //console.log(req.body);
  // Those are required and must always be present
  const model = req.body.model;
  const maxTokens = req.body.max_tokens_to_sample;
  const prompt = req.body.prompt;

  const temp = req.body.temperature || 1.0;
  const top_p = req.body.top_p || null;
  const top_k = req.body.top_k || null;
  const stopSequences = req.body.stop_sequences || null;
  const isStream = req.body.stream || false;

  console.log(`Doing a request with stream = ${isStream}.`)
  // Set up axios instance for SSE
  const sourcegraph = axios.create({
    baseURL: 'https://sourcegraph.com/.api/completions/stream',
    headers: {
      'Content-Type': 'application/json',
      'Authorization': `token ${API_TOKEN}`
    },
    responseType: 'stream',
    timeout: 180000,
  });

  let fullContent = "";

  try {
    let postData = {
      model: model,
      prompt: prompt,
      maxTokensToSample: maxTokens
    };
    
    if (temp) postData.temperature = temp;
    if (stopSequences) postData.stop_sequences = stopSequences;
    if (top_p) postData.top_p = top_p;
    if (top_k) postData.top_k = top_k;
    const response = await sourcegraph.post('', postData);

    let previousCompletion = "";
    // GPT-4 told me to use a StringDecoder so that multi-byte characters are correctly handled across chunks
    let decoder = new StringDecoder('utf8');
    let buffer = ""; // Buffer to hold incomplete lines

    response.data.on('data', (chunk) => {
      buffer += decoder.write(chunk);
      let lines = buffer.split("\n");
      buffer = lines.pop(); // Keep the last (potentially incomplete) line in the buffer

      const data = lines.filter(line => line.startsWith('data: ')).map(line => line.replace(/^data: /, ''));

      data.forEach((chunk) => {
        try {
          const parsedData = JSON.parse(chunk);
          if ('completion' in parsedData) {
            //console.log(resp);
            if (isStream) {
              // SourceGraph API always returns the full string, but we need the diff
              // We can use .length because StringDecoder correctly handles multi-byte characters
              const newPart = parsedData.completion.substring(previousCompletion.length); 
              previousCompletion = parsedData.completion;
              let resp = { completion: newPart, stop_reason: null };
              res.write(`event: completion\r\ndata: ${JSON.stringify(resp)}\r\n\r\n`);
            }
            else {
              fullContent = parsedData.completion;
            }
          }
        } catch (error) {
          console.log("Invalid JSON chunk: ", chunk);
          // do nothing, the JSON chunk is incomplete
      }})
    });

    response.data.on('end', () => {
      // Since the last char will be a newline char and not a multi-byte one, we're sure that
      // the decoder will be empty, so we can just end it.
      decoder.end();
      
      if (isStream) {
        let finalResp = {completion: "", stop_reason: "stop_sequence"};
        res.write(`event: completion\r\ndata: ${JSON.stringify(finalResp)}\r\n\r\n`);
      }
      else {
        res.write(JSON.stringify({completion: fullContent, stop_reason: "stop_sequence"}));
      }
      res.end();
      console.log(`Request done.`)
    });

  } catch (error) {
    console.error("Got an error in the main route:\n", error);
    handleError(res, isStream);
  }
});

app.use((err, req, res, next) => {
  console.log("Got an unhandled exception:\n", err);
  handleError(res, req.body && req.body.stream || false);
});

process.on('uncaughtException', (err) => {
  console.error('Uncaught exception:', err);
});

process.on('unhandledRejection', (reason, promise) => {
  console.error('Unhandled Promise Rejection:', reason);
});

async function checkToken(token) {
  const data = {
    query: 'query { currentUser { username } }'
  };

  const config = {
    method: 'post',
    url: 'https://sourcegraph.com/.api/graphql',
    headers: { 
      'Authorization': `token ${token}`
    },
    data: data
  };

  try {
    const response = await axios(config);
    if(response.data && response.data.data && response.data.data.currentUser) {
      console.log(`Token works, username: ${response.data.data.currentUser.username}`);
      return true;
    } else {
      return false;
    }
  } catch (error) {
    return false;
  }
}

// Two basic checks
if (!API_TOKEN) {
  console.error("SourceGraph API token not found! Create a file named '.env' and put your token there as an API_TOKEN. See .env.example for an example.");
  process.exit(1);
}
else if (API_TOKEN.indexOf("sgp_") == -1) {
  console.error("Invalid SourceGraph API token! Make sure you copied the whole token starting with sgp_, like 'sgp_blablabla'.");
  process.exit(1);
}

// Check token validity
checkToken(API_TOKEN).then(isValid => {
  if (!isValid) {
    console.error("Invalid SourceGraph API token! Make sure you copied the whole token and that the token is not revoked.");
    process.exit(1);
  }

  const port = process.env.PORT || 3000;
  app.listen(port, () => console.log(`Server listening on port ${port}`));
});
first commit 2023-08-28 03:46:12 -06:00			`require("dotenv").config();`

			`const express = require('express');`
			`const axios = require('axios');`
			`const app = express();`
Fix #2, add execute bit to start.sh 2023-08-30 01:52:24 -06:00			`const StringDecoder = require('string_decoder').StringDecoder;`

Change body limit from default, show help with context 2023-08-29 04:03:11 -06:00			`const bodyParser = require('body-parser');`
			`app.use(bodyParser.json({ limit: '100mb' }));`
			`app.use(bodyParser.urlencoded({limit: '100mb', extended: true}));`
first commit 2023-08-28 03:46:12 -06:00
			`const API_TOKEN = process.env.API_TOKEN;`

Fix #1 by adding proper error handling (and notifying the user about it) 2023-08-30 02:09:12 -06:00			`function handleError(res, isStream) {`
			`// If the request hasn't finished, notify the user that there was an error and finish`
			`// the request properly, so that ST isn't left hanging.`
			`const errMsg = "\nReceived an error during the request, please check sg-proxy logs!";`
			`let jsonResp = {completion: errMsg, stop_reason: "stop_sequence"};`
			`if (!res.writableEnded) {`
			`if (isStream) {`
			res.write(`event: completion\r\ndata: ${JSON.stringify(jsonResp)}\r\n\r\n`);
			`} else {`
			`// This is unlikely to trigger, but can happen if the error was caught`
			`// before the request was sent (without streaming)`
			`res.json(jsonResp);`
			`}`
			`res.end();`
			`}`
			`}`

first commit 2023-08-28 03:46:12 -06:00			`app.post('/v1/complete', async (req, res) => {`
			`res.setHeader('Content-Type', 'text/event-stream; charset=utf-8');`
			`res.setHeader('Cache-Control', 'no-cache');`
			`res.setHeader('Connection', 'keep-alive');`
			`res.setHeader('Transfer-Encoding', 'chunked');`
			`res.flushHeaders();`

			`//console.log(req.body);`
Fix #1 by adding proper error handling (and notifying the user about it) 2023-08-30 02:09:12 -06:00			`// Those are required and must always be present`
first commit 2023-08-28 03:46:12 -06:00			`const model = req.body.model;`
Fix #1 by adding proper error handling (and notifying the user about it) 2023-08-30 02:09:12 -06:00			`const maxTokens = req.body.max_tokens_to_sample;`
			`const prompt = req.body.prompt;`

first commit 2023-08-28 03:46:12 -06:00			`const temp = req.body.temperature \|\| 1.0;`
			`const top_p = req.body.top_p \|\| null;`
			`const top_k = req.body.top_k \|\| null;`
			`const stopSequences = req.body.stop_sequences \|\| null;`
Added non-streaming support 2023-08-28 04:39:57 -06:00			`const isStream = req.body.stream \|\| false;`
first commit 2023-08-28 03:46:12 -06:00
Added non-streaming support 2023-08-28 04:39:57 -06:00			console.log(`Doing a request with stream = ${isStream}.`)
first commit 2023-08-28 03:46:12 -06:00			`// Set up axios instance for SSE`
			`const sourcegraph = axios.create({`
			`baseURL: 'https://sourcegraph.com/.api/completions/stream',`
			`headers: {`
			`'Content-Type': 'application/json',`
			'Authorization': `token ${API_TOKEN}`
			`},`
			`responseType: 'stream',`
			`timeout: 180000,`
			`});`

Added non-streaming support 2023-08-28 04:39:57 -06:00			`let fullContent = "";`

first commit 2023-08-28 03:46:12 -06:00			`try {`
			`let postData = {`
			`model: model,`
			`prompt: prompt,`
			`maxTokensToSample: maxTokens`
			`};`

			`if (temp) postData.temperature = temp;`
			`if (stopSequences) postData.stop_sequences = stopSequences;`
			`if (top_p) postData.top_p = top_p;`
			`if (top_k) postData.top_k = top_k;`
			`const response = await sourcegraph.post('', postData);`

			`let previousCompletion = "";`
Fix #2, add execute bit to start.sh 2023-08-30 01:52:24 -06:00			`// GPT-4 told me to use a StringDecoder so that multi-byte characters are correctly handled across chunks`
			`let decoder = new StringDecoder('utf8');`
first commit 2023-08-28 03:46:12 -06:00			`let buffer = ""; // Buffer to hold incomplete lines`

			`response.data.on('data', (chunk) => {`
Fix #2, add execute bit to start.sh 2023-08-30 01:52:24 -06:00			`buffer += decoder.write(chunk);`
first commit 2023-08-28 03:46:12 -06:00			`let lines = buffer.split("\n");`
			`buffer = lines.pop(); // Keep the last (potentially incomplete) line in the buffer`

			`const data = lines.filter(line => line.startsWith('data: ')).map(line => line.replace(/^data: /, ''));`

			`data.forEach((chunk) => {`
			`try {`
			`const parsedData = JSON.parse(chunk);`
			`if ('completion' in parsedData) {`
			`//console.log(resp);`
Added non-streaming support 2023-08-28 04:39:57 -06:00			`if (isStream) {`
			`// SourceGraph API always returns the full string, but we need the diff`
Fix #2, add execute bit to start.sh 2023-08-30 01:52:24 -06:00			`// We can use .length because StringDecoder correctly handles multi-byte characters`
			`const newPart = parsedData.completion.substring(previousCompletion.length);`
Added non-streaming support 2023-08-28 04:39:57 -06:00			`previousCompletion = parsedData.completion;`
			`let resp = { completion: newPart, stop_reason: null };`
			res.write(`event: completion\r\ndata: ${JSON.stringify(resp)}\r\n\r\n`);
			`}`
			`else {`
			`fullContent = parsedData.completion;`
			`}`
first commit 2023-08-28 03:46:12 -06:00			`}`
			`} catch (error) {`
Fix #2, add execute bit to start.sh 2023-08-30 01:52:24 -06:00			`console.log("Invalid JSON chunk: ", chunk);`
			`// do nothing, the JSON chunk is incomplete`
first commit 2023-08-28 03:46:12 -06:00			`}})`
			`});`

			`response.data.on('end', () => {`
Fix #2, add execute bit to start.sh 2023-08-30 01:52:24 -06:00			`// Since the last char will be a newline char and not a multi-byte one, we're sure that`
			`// the decoder will be empty, so we can just end it.`
			`decoder.end();`

Added non-streaming support 2023-08-28 04:39:57 -06:00			`if (isStream) {`
			`let finalResp = {completion: "", stop_reason: "stop_sequence"};`
			res.write(`event: completion\r\ndata: ${JSON.stringify(finalResp)}\r\n\r\n`);
			`}`
			`else {`
			`res.write(JSON.stringify({completion: fullContent, stop_reason: "stop_sequence"}));`
			`}`
misc 2023-08-28 04:42:41 -06:00			`res.end();`
			console.log(`Request done.`)
first commit 2023-08-28 03:46:12 -06:00			`});`

			`} catch (error) {`
Fix #1 by adding proper error handling (and notifying the user about it) 2023-08-30 02:09:12 -06:00			`console.error("Got an error in the main route:\n", error);`
			`handleError(res, isStream);`
first commit 2023-08-28 03:46:12 -06:00			`}`
			`});`

			`app.use((err, req, res, next) => {`
Fix #1 by adding proper error handling (and notifying the user about it) 2023-08-30 02:09:12 -06:00			`console.log("Got an unhandled exception:\n", err);`
			`handleError(res, req.body && req.body.stream \|\| false);`
first commit 2023-08-28 03:46:12 -06:00			`});`

			`process.on('uncaughtException', (err) => {`
			`console.error('Uncaught exception:', err);`
			`});`

			`process.on('unhandledRejection', (reason, promise) => {`
			`console.error('Unhandled Promise Rejection:', reason);`
			`});`

Add proper token checking, just have .env directly in here 2023-08-28 05:04:54 -06:00			`async function checkToken(token) {`
			`const data = {`
			`query: 'query { currentUser { username } }'`
			`};`

			`const config = {`
			`method: 'post',`
			`url: 'https://sourcegraph.com/.api/graphql',`
			`headers: {`
			'Authorization': `token ${token}`
			`},`
			`data: data`
			`};`

			`try {`
			`const response = await axios(config);`
			`if(response.data && response.data.data && response.data.data.currentUser) {`
			console.log(`Token works, username: ${response.data.data.currentUser.username}`);
			`return true;`
			`} else {`
			`return false;`
			`}`
			`} catch (error) {`
			`return false;`
			`}`
			`}`

			`// Two basic checks`
Add basic token sanity checks 2023-08-28 04:50:56 -06:00			`if (!API_TOKEN) {`
			`console.error("SourceGraph API token not found! Create a file named '.env' and put your token there as an API_TOKEN. See .env.example for an example.");`
Add proper token checking, just have .env directly in here 2023-08-28 05:04:54 -06:00			`process.exit(1);`
Add basic token sanity checks 2023-08-28 04:50:56 -06:00			`}`
			`else if (API_TOKEN.indexOf("sgp_") == -1) {`
Add proper token checking, just have .env directly in here 2023-08-28 05:04:54 -06:00			`console.error("Invalid SourceGraph API token! Make sure you copied the whole token starting with sgp_, like 'sgp_blablabla'.");`
			`process.exit(1);`
Add basic token sanity checks 2023-08-28 04:50:56 -06:00			`}`

Add proper token checking, just have .env directly in here 2023-08-28 05:04:54 -06:00			`// Check token validity`
			`checkToken(API_TOKEN).then(isValid => {`
			`if (!isValid) {`
license + misc changes 2023-08-28 05:38:59 -06:00			`console.error("Invalid SourceGraph API token! Make sure you copied the whole token and that the token is not revoked.");`
Add proper token checking, just have .env directly in here 2023-08-28 05:04:54 -06:00			`process.exit(1);`
			`}`

			`const port = process.env.PORT \|\| 3000;`
			app.listen(port, () => console.log(`Server listening on port ${port}`));
			`});`