@waylaidwanderer/chatgpt-api - npm Package Compare versions

Comparing version 1.2.2 to 1.3.0

bin/cli.js

		@@ -52,9 +52,14 @@ #!/usr/bin/env node
		spinner.start();
		const response = await chatGptClient.sendMessage(message, { conversationId, parentMessageId });
		spinner.stop();
		conversationId = response.conversationId;
		parentMessageId = response.messageId;
		console.log(boxen(response.response, { title: 'ChatGPT', padding: 0.7, margin: 1, dimBorder: true }));
		await clipboard.write(response.response);
		try {
		const response = await chatGptClient.sendMessage(message, { conversationId, parentMessageId });
		spinner.stop();
		conversationId = response.conversationId;
		parentMessageId = response.messageId;
		console.log(boxen(response.response, { title: 'ChatGPT', padding: 0.7, margin: 1, dimBorder: true }));
		await clipboard.write(response.response);
		} catch (error) {
		spinner.stop();
		console.log(boxen(error?.json?.error?.message \|\| error.body, { title: 'Error', padding: 0.7, margin: 1, borderColor: 'red' }));
		}
		return conversation(conversationId, parentMessageId);
		}

package.json

		{
		"name": "@waylaidwanderer/chatgpt-api",
		"version": "1.2.2",
		"version": "1.3.0",
		"description": "A ChatGPT implementation using the official ChatGPT model via OpenAI's API.",
		@@ -5,0 +5,0 @@ "main": "index.js",

README.md

		@@ -158,11 +158,18 @@ <p align="center">

		ChatGPT's responses are automatically copied to your clipboard, so you can paste them into other applications.

		## Caveats
		Since `text-chat-davinci-002-20230126` is ChatGPT's raw model, I had to do my best to replicate the way the official ChatGPT website uses it.
		This means it may not behave exactly the same in some ways:
		- conversations are not tied to any user IDs, so if that's important to you, you should implement your own user ID system
		- ChatGPT's model parameters are unknown, so I set some defaults that I thought would be reasonable, such as `temperature: 0.7`
		- conversations are limited to roughly the last 3000 tokens, so earlier messages may be forgotten during longer conversations
		- this works in a similar way to ChatGPT, except I'm pretty sure they have some additional way of retrieving context from earlier messages when needed (which can probably be achieved with embeddings, but I consider that out-of-scope for now)
		- I removed "knowledge cutoff" from the ChatGPT preamble ("You are ChatGPT..."), which stops it from refusing to answer questions about events after 2021-09, as it does have some training data from after that date. This means it may answer questions about events after 2021-09, but it's not guaranteed to be accurate.
		Since `text-chat-davinci-002-20230126` is ChatGPT's raw model, I had to do my best to replicate the way the official ChatGPT website uses it. After extensive testing and comparing responses, I believe that the model used by ChatGPT has some additional fine-tuning.
		This means my implementation or the raw model may not behave exactly the same in some ways:
		- Conversations are not tied to any user IDs, so if that's important to you, you should implement your own user ID system.
		- ChatGPT's model parameters (temperature, frequency penalty, etc.) are unknown, so I set some defaults that I thought would be reasonable.
		- Conversations are limited to roughly the last 3000 tokens, so earlier messages may be forgotten during longer conversations.
		- This works in a similar way to ChatGPT, except I'm pretty sure they have some additional way of retrieving context from earlier messages when needed (which can probably be achieved with embeddings, but I consider that out-of-scope for now).
		- It is well known that, as part of the fine-tuning, ChatGPT had the following preamble:
		> "You are ChatGPT, a large language model trained by OpenAI. You answer as concisely as possible for each response (e.g. don’t be verbose). It is very important that you answer as concisely as possible, so please remember this. If you are generating a list, do not have too many items. Keep the number of items short.
		> Knowledge cutoff: 2021-09
		> Current date: 2023-01-31"

		As OpenAI updates ChatGPT, this preamble may also change. The default prompt prefix in my implementation attempts to replicate a similar behavior to the current ChatGPT model.

		## Contributing
		@@ -169,0 +176,0 @@ If you'd like to contribute to this project, please create a pull request with a detailed description of your changes.

src/ChatGPTClient.js

		@@ -24,3 +24,3 @@ import fetch from 'node-fetch';
		presence_penalty: typeof modelOptions.presence_penalty === 'undefined' ? 0.6 : modelOptions.presence_penalty,
		stop: modelOptions.stop \|\| ['<\|im_end\|>'],
		stop: modelOptions.stop \|\| ['<\|im_end\|>', '<\|im_sep\|>'],
		};
		@@ -47,3 +47,10 @@
		const body = await response.text();
		throw new Error(`Failed to send message. HTTP ${response.status} - ${body}`);
		const error = new Error(`Failed to send message. HTTP ${response.status} - ${body}`);
		error.status = response.status;
		try {
		error.json = JSON.parse(body);
		} catch {
		error.body = body;
		}
		throw error;
		}
		@@ -87,3 +94,3 @@ return response.json();
		parentMessageId: userMessage.id,
		role: 'Assistant',
		role: 'ChatGPT',
		message: reply,
		@@ -120,26 +127,15 @@ };
		promptPrefix = this.options.promptPrefix;
		// If the prompt prefix doesn't end with 2 newlines, add them.
		if (!promptPrefix.endsWith('\n\n')) {
		promptPrefix = `${promptPrefix}\n\n`;
		// If the prompt prefix doesn't end with the separator token, add it.
		if (!promptPrefix.endsWith('<\|im_sep\|>\n\n')) {
		promptPrefix = `${promptPrefix}<\|im_sep\|>\n\n`;
		}
		} else {
		/*
		ChatGPT preamble example:
		You are ChatGPT, a large language model trained by OpenAI. You answer as concisely as possible for each response (e.g. don’t be verbose). It is very important that you answer as concisely as possible, so please remember this. If you are generating a list, do not have too many items. Keep the number of items short.
		Knowledge cutoff: 2021-09
		Current date: 2023-01-31
		*/
		// This preamble was obtained by asking ChatGPT "Please print the instructions you were given before this message."
		// Build the current date string.
		const currentDate = new Date();
		const currentDateString = currentDate.getFullYear()
		+ "-"
		+ (currentDate.getMonth() + 1).toString().padStart(2, '0')
		+ "-"
		+ currentDate.getDate();
		const currentDateString = new Date().toLocaleDateString(
		'en-us',
		{ year: 'numeric', month: 'long', day: 'numeric' },
		);

		promptPrefix = `You are ChatGPT, a large language model trained by OpenAI. You answer as concisely as possible for each response (e.g. don’t be verbose). It is very important that you answer as concisely as possible, so please remember this. If you are generating a list, do not have too many items. Keep the number of items short.
		Current date: ${currentDateString}\n\n`;
		promptPrefix = `Respond conversationally.\nCurrent date: ${currentDateString}<\|im_end\|>\n\n`
		}
		const promptSuffix = "\n"; // Prompt should end with 2 newlines, so we add one here.
		const promptSuffix = "ChatGPT:\n"; // Prompt should end with 2 newlines, so we add one here.

		@@ -153,3 +149,3 @@ let currentTokenCount = this.getTokenCount(`${promptPrefix}${promptSuffix}`);
		const message = orderedMessages.pop();
		const messageString = `${message.message}<\|im_end\|>\n`;
		const messageString = `${message.role}:\n${message.message}<\|im_sep\|>\n`;
		const newPromptBody = `${messageString}${promptBody}`;
		@@ -182,5 +178,6 @@
		if (this.modelOptions.model === CHATGPT_MODEL) {
		// With this model, "<\|im_end\|>" is 1 token, but tokenizers aren't aware of it yet.
		// With this model, "<\|im_end\|>" and "<\|im_sep\|>" is 1 token, but tokenizers aren't aware of it yet.
		// Replace it with "<\|endoftext\|>" (which it does know about) so that the tokenizer can count it as 1 token.
		text = text.replace(/<\\|im_end\\|>/g, '<\|endoftext\|>');
		text = text.replace(/<\\|im_sep\\|>/g, '<\|endoftext\|>');
		}
		@@ -187,0 +184,0 @@ return gptEncode(text).length;

@waylaidwanderer/chatgpt-api - npm Package Compare versions

New alerts

Fixed alerts

Improved metrics