2025-12-08 15:27:18 +08:00
parent f87538350c
commit 02ef7b3476
12 changed files with 1 addition and 471 deletions

View File

@@ -1,6 +1,6 @@
{
"name": "@kevisual/ai",
"version": "0.0.18",
"version": "0.0.19",
"description": "AI Center Services",
"main": "index.js",
"basename": "/root/ai-center-services",

View File

@@ -1,59 +0,0 @@
import { BailianProvider } from '../../provider/index.ts';
import dotenv from 'dotenv';
dotenv.config();
import { App } from '@kevisual/router';
import util from 'node:util';
const ai = new BailianProvider({
apiKey: process.env.BAILIAN_API_KEY || '',
model: 'qwen-turbo-latest',
baseURL: 'https://dashscope.aliyuncs.com/compatible-mode/v1'
})
// const res = await ai.chat([
// {
// role: 'user',
// content: `What is 1+1?`
// },
// ],
// )
// // console.log('AI Response:', res);
// const content = res.choices[0].message?.content || ''
// console.log(util.inspect(res, { depth: null }))
// console.log('responseText', ai.responseText)
// const res = await ai.chatStream([
// {
// role: 'user',
// content: `What is 1+1?`
// },
// ],
// )
// // console.log('AI Response:', res);
// export const readStream = async (chatStream) => {
// let buffer = '';
// for await (const chunk of chatStream) {
// // each chunk is already a decoded string; just concatenate
// buffer += chunk;
// }
// console.log('AI Response:', buffer);
// };
// await readStream(res);
const embedding = await ai.generateEmbeddingCore([
'你好,世界!',
'Hello, world!',
], {
model: 'text-embedding-v4',
});
console.log('Embedding Response:', util.inspect(embedding, { depth: null }));
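As a follow-up, a minimal sketch of comparing the two vectors returned above with cosine similarity. It assumes an OpenAI-compatible embeddings shape (embedding.data[i].embedding is a number[]), which the code above does not itself confirm:

// Hedged sketch: cosine similarity between the Chinese and English embeddings.
// Assumes embedding.data[i].embedding is a number[] (OpenAI-compatible shape).
const cosine = (a: number[], b: number[]) => {
  let dot = 0, na = 0, nb = 0;
  for (let i = 0; i < a.length; i++) {
    dot += a[i] * b[i];
    na += a[i] * a[i];
    nb += b[i] * b[i];
  }
  return dot / (Math.sqrt(na) * Math.sqrt(nb));
};
const [zh, en] = embedding.data.map((d: { embedding: number[] }) => d.embedding);
console.log('cosine(zh, en):', cosine(zh, en));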

View File

@@ -1,65 +0,0 @@
import { getChunks } from '../../provider/utils/chunk.ts';
const str = 'Hello world this is a test 你好沙盒 very big';
const str2 = `You cannot directly use tiktoken (OpenAI's tokenizer) to count tokens for Qwen models, because the two differ completely in tokenization rules and vocabulary.
Why can't they be mixed?
Different vocabularies
tiktoken was built by OpenAI for the GPT series (e.g. gpt-3.5-turbo, gpt-4); its vocabulary is optimized for English and code.
Qwen uses an independently trained BPE vocabulary that is friendlier to Chinese and multilingual text, so the tokenization granularity can differ.
Large differences in tokenization results
The same text may be tokenized completely differently by tiktoken and Qwen. For example:
OpenAI (tiktoken): "你好" → ['你', '好'] (2 tokens)
Qwen: "你好" → ['你好'] (1 token, if the vocabulary contains that combination)
Practical problems
Even if you force tiktoken to count tokens for Qwen, the result is inaccurate and may cause:
Input that exceeds the model's context limit (because of the counting error).
Unexpected errors in API billing or local inference.
The correct approach: use Qwen's own tokenizer
Load Qwen's native tokenizer via Hugging Face transformers:
from transformers import AutoTokenizer
# Load the Qwen tokenizer (Qwen-7B as an example)
tokenizer = AutoTokenizer.from_pretrained("Qwen/Qwen-7B", trust_remote_code=True)
text = "你好,Qwen模型!"
tokens = tokenizer.tokenize(text)  # inspect the tokenization
token_count = len(tokenizer.encode(text, add_special_tokens=False))
print("Tokens:", tokens)
print("Token count:", token_count)
FAQ
Why is trust_remote_code=True required?
The Qwen tokenizer is a custom implementation (not Hugging Face native); this flag allows executable code to be loaded from the model repository.
What about counting tokens in other languages?
Qwen tokenizes non-English text (e.g. Chinese, Japanese) efficiently, but you still need its native tokenizer for the counts.
How does the speed compare with tiktoken?
tiktoken is a fast, highly optimized implementation; the Hugging Face-based Qwen tokenizer may be slightly slower but matches what the model actually needs.
Summary
Never mix them: tiktoken ≠ the Qwen tokenizer.
Always use the model's own tooling: for Qwen, load the official tokenizer through transformers.
Note for Chinese in particular: Qwen tokenizes Chinese more efficiently, and using it directly avoids miscounts.
To inspect the tokenization rules, you can browse the vocabulary via tokenizer.vocab (but note that vocabularies are usually large).`
const chunks = getChunks(str2);
console.log(chunks);
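For reference, a hedged TypeScript counterpart of the Python snippet embedded in str2 above, using transformers.js. It assumes the @huggingface/transformers package is installed and that the chosen Qwen repository ships tokenizer files transformers.js can load; the model id is illustrative only:

// Hedged sketch: count Qwen tokens from TypeScript via transformers.js.
import { AutoTokenizer } from '@huggingface/transformers';

const tokenizer = await AutoTokenizer.from_pretrained('Qwen/Qwen2.5-7B-Instruct');
const text = '你好,Qwen模型!';
const ids = tokenizer.encode(text); // token ids under Qwen's BPE vocabulary
console.log('Token count:', ids.length);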

View File

@@ -1,18 +0,0 @@
import { Jimen } from "../jimeng/index.ts"
import dotenv from 'dotenv';
dotenv.config();
const jimeng = new Jimen({
token: process.env.JIMENG_TOKEN,
})
console.log("Generating image...");
await jimeng.generateImage({
prompt: "Create a digital artwork of a futuristic city, full of high-tech and innovative elements, with vivid colors and rich detail",
resolution: "2k"
}).then((res) => {
console.log("Image generation response:", res);
}).catch((err) => {
console.error("Error generating image:", err);
});

View File

@@ -1,9 +0,0 @@
import { encryptAES, decryptAES } from '../../provider/utils/parse-config.ts';
const plaintext = process.env.API_KEY || '';
const decryptKey = process.env.DECRYPT_KEY || '';
const encrypted = encryptAES(plaintext, decryptKey);
console.log('encrypted', encrypted);
const decrypted = decryptAES(encrypted, decryptKey);
console.log(decrypted);

View File

@@ -1,35 +0,0 @@
curl --request POST \
--url https://api.siliconflow.cn/v1/chat/completions \
--header 'Authorization: Bearer sk-qbiigkzoaamuqxtwlgkugodncebkfbosemadfubjrseobpvx' \
--header 'Content-Type: application/json' \
--data '{
"model": "Qwen/Qwen3-14B",
"messages": [
{
"role": "user",
"content": "计算a+b的值"
}
],
"stream": false,
"max_tokens": 512,
"stop": null,
"temperature": 0.7,
"top_p": 0.7,
"top_k": 50,
"frequency_penalty": 0.5,
"n": 1,
"response_format": {
"type": "text"
},
"tools": [
{
"type": "function",
"function": {
"description": "计算abc算法的值a=1b=2c=3",
"name": "compouted",
"parameters": {},
"strict": false
}
}
]
}'
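For convenience, the same request expressed in TypeScript with fetch; a sketch only, reusing the payload above but assuming SILICONFLOW_API_KEY is set in the environment instead of hard-coding the key:

// Hedged sketch: the SiliconFlow chat-completions request above, via fetch.
const res = await fetch('https://api.siliconflow.cn/v1/chat/completions', {
  method: 'POST',
  headers: {
    Authorization: `Bearer ${process.env.SILICONFLOW_API_KEY}`,
    'Content-Type': 'application/json',
  },
  body: JSON.stringify({
    model: 'Qwen/Qwen3-14B',
    messages: [{ role: 'user', content: 'Compute the value of a+b' }],
    stream: false,
    max_tokens: 512,
    tools: [
      {
        type: 'function',
        function: { name: 'computed', description: 'Computes the value of the abc algorithm, where a=1, b=2, c=3', parameters: {}, strict: false },
      },
    ],
  }),
});
console.log(await res.json());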

View File

@@ -1,116 +0,0 @@
import { SiliconFlow } from '../../provider/chat-adapter/siliconflow.ts';
import { Ollama } from '../../provider/chat-adapter/ollama.ts';
import dotenv from 'dotenv';
dotenv.config();
const siliconflow = new SiliconFlow({
apiKey: process.env.SILICONFLOW_API_KEY,
model: 'Qwen/Qwen3-14B',
});
const ollama = new Ollama({
model: 'qwen3:32b',
apiKey: process.env.OLLAMA_API_KEY,
baseURL: process.env.OLLAMA_BASE_URL,
});
const main = async () => {
const usage = await siliconflow.getUsageInfo();
console.log(usage);
};
// 1. Define the locally available tool functions
const availableFunctions: Record<string, (args: any) => Promise<any>> = {
get_time: async (args: { location: string }) => {
// Simulated API call
console.log('time', args);
return {
time: '2022-03-22 12:00:00',
};
},
get_location: async (args: { symbol: string }) => {
// Simulated API call
console.log('location', args);
return {
city: 'Beijing',
};
},
};
// main();
const funcCall = async (model = siliconflow) => {
const tools = [
{
type: 'function',
function: {
name: 'get_time',
description: 'Get the current time',
parameters: {
type: 'object',
properties: {
location: {
type: 'string',
description: 'The location',
},
},
required: ['location'],
},
},
},
{
type: 'function',
function: {
name: 'get_location',
description: 'Get the current location',
parameters: {},
strict: false,
},
},
];
const messages: any[] = [{ role: 'user', content: 'Get the current time at the current location' }];
const res = await model.chat(messages, {
tools: tools as any,
});
console.log(res.choices[0]);
const assistantMessage = res.choices[0].message;
const finish_reason = res.choices[0].finish_reason;
messages.push(assistantMessage);
let toolCalls = assistantMessage.tool_calls;
console.log('toolCalls', JSON.stringify(toolCalls));
let maxRetries = 3;
while (toolCalls && toolCalls.length > 0) {
// Handle each tool call requested by the model
for (const toolCall of toolCalls) {
const functionName = toolCall.function.name;
const functionArgs = JSON.parse(toolCall.function.arguments);
// Invoke the matching local function
const functionResponse = await availableFunctions[functionName](functionArgs);
// Append the tool result to the message history
messages.push({
role: 'tool',
name: functionName,
content: JSON.stringify(functionResponse),
tool_call_id: toolCall.id,
});
}
// Follow-up call: send the tool results back so the model can produce the final reply
const secondResponse = await model.chat(messages, {
tools: tools as any,
});
const finalMessage = secondResponse.choices[0].message;
messages.push(finalMessage);
const _toolCalls = finalMessage.tool_calls;
console.log('toolCalls', JSON.stringify(_toolCalls), finalMessage.role);
toolCalls = _toolCalls ?? [];
maxRetries--;
if (maxRetries <= 0) {
break;
}
console.log('tool calls', toolCalls);
}
console.log(messages);
};
funcCall(ollama as any);

View File

@@ -1,26 +0,0 @@
import { ModelScope } from '../../provider/chat-adapter/model-scope.ts';
import { logger } from '../../modules/logger.ts';
import { config } from 'dotenv';
config();
const chat = new ModelScope({
apiKey: process.env.MODEL_SCOPE_API_KEY,
model: 'Qwen/Qwen2.5-Coder-32B-Instruct',
});
// chat.chat([{ role: 'user', content: 'Hello, world! 1 + 1 equals ?' }]);
const chatMessage = [{ role: 'user', content: 'Hello, world! 1 + 1 equals ?' }];
const main = async () => {
const res = await chat.test();
logger.info('test', res);
};
main();
const mainChat = async () => {
const res = await chat.chat(chatMessage as any);
logger.info('chat', res);
};
// mainChat();

View File

@@ -1,37 +0,0 @@
import { Knowledge } from '../../../../src/provider/knowledge/knowledge.ts';
import fs from 'fs';
import dotenv from 'dotenv';
dotenv.config();
const knowledge = new Knowledge({
embeddingModel: 'bge-m3:latest',
baseURL: 'https://ollama.xiongxiao.me/v1',
model: 'qwq:latest',
apiKey: process.env.OLLAMA_API_KEY,
});
const main = async () => {
const res = await knowledge.generateEmbeddingCore('Hello world this is a test 你好沙盒 very big');
fs.writeFileSync('docs/embedding.json', JSON.stringify(res, null, 2));
console.log(res);
};
main();
const main2 = async () => {
const texts = ['Hello, world! this is a test', ...Array.from({ length: 9 }, (_, i) => `Hello, world! this is a test ${i + 2}`)];
const res = await knowledge.generateEmbeddingCore(texts);
fs.writeFileSync('docs/embedding2.json', JSON.stringify(res, null, 2));
console.log(res);
};
// main2();

View File

@@ -1,86 +0,0 @@
import { Ollama } from '../../../../src/provider/chat-adapter/ollama.ts';
import util from 'util';
const chat = new Ollama({
baseURL: 'https://ollama.xiongxiao.me/v1',
apiKey: 'xiongxiao2233',
model: 'qwq:latest',
});
// chat.chat([{ role: 'user', content: 'Hello, world!' }]);
const main = async () => {
const res = await chat.test();
console.log(util.inspect(res, { depth: null, colors: true }));
};
// main();
const getJson = async () => {
const res = await chat.chat(
[
{ role: 'system', content: 'Return the data I send as the corresponding JSON; only process the data that was sent. If multiple items are sent, give me an array.' },
// { role: 'user', content: '{"name":"John","age":30}' },
{ role: 'user', content: 'name: 张三' },
{ role: 'user', content: 'name: 李四, age: 18' },
],
{
response_format: {
type: 'json_schema',
json_schema: {
name: 'user',
description: '用户信息',
schema: {
type: 'object',
properties: {
name: { type: 'string' },
age: { type: 'number' },
},
required: ['name', 'age'],
},
},
},
n: 10,
},
);
console.log(util.inspect(res, { depth: null, colors: true }));
};
// getJson();
const createChat1 = async () => {
const res = await chat.chat(
[
{ role: 'user', content: 'a=1, b=2, c=3' },
{ role: 'user', content: 'a+b+c=?' },
{ role: 'assistant', content: 'The given values are \\( a = 1 \\), \\( b = 2 \\), \\( c = 3 \\).\n' + '\n' + 'Therefore, \\( a + b + c = 1 + 2 + 3 = 6 \\).' },
{ role: 'user', content: 'a+b+c+4=?' },
],
{
model: 'qwen2.5:7b',
},
);
console.log(util.inspect(res, { depth: null, colors: true }));
};
// createChat1();
const getTags = async () => {
const res = await chat.listModels();
console.log(util.inspect(res, { depth: null, colors: true }));
};
// getTags();
const getRunModels = async () => {
const res = await chat.listRunModels();
console.log('current', new Date().toISOString());
console.log(util.inspect(res, { depth: null, colors: true }));
};
// getRunModels();

View File

@@ -1,7 +0,0 @@
import { ProviderManager } from '../../provider/index.ts';
import { config } from 'dotenv';
config();
const providerConfig = { provider: 'ModelScope', model: 'Qwen/Qwen2.5-Coder-32B-Instruct', apiKey: process.env.MODEL_SCOPE_API_KEY };
const provider = await ProviderManager.createProvider(providerConfig);
const result = await provider.chat([{ role: 'user', content: 'Hello' }]);
console.log(result);

View File

@@ -1,12 +0,0 @@
/**
 * Try to extract a JSON object from a ```json fenced block in a string
 */
export const getJsonFromString = (str: string) => {
try {
const jsonMatch = str.match(/```json\s*([\s\S]*?)\s*```/);
if (jsonMatch && jsonMatch[1]) {
return JSON.parse(jsonMatch[1]);
}
} catch (error) {
// Malformed JSON inside the fence: fall through and return null
}
return null;
};
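For illustration, a minimal usage sketch of getJsonFromString; the sample reply string is hypothetical:

// The function returns the parsed object from the first ```json fence,
// or null when no fence exists or the JSON inside is malformed.
const reply = 'Here is the result:\n```json\n{ "name": "qwen-turbo-latest", "ok": true }\n```';
const parsed = getJsonFromString(reply);
console.log(parsed); // { name: 'qwen-turbo-latest', ok: true }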