Diff
checker
文本
文本
图像
文档
Excel
文件夹
Legal
Enterprise
桌面版
定价
登录
下载 Diffchecker 桌面版
比较文本
查找两个文本文件之间的差异
工具
历史
实时编辑器
折叠未更改行
关闭换行
视图
拆分
统一
比对精度
智能
单词
字符
语法高亮
选择语法
忽略
文本转换
转到第一个差异
编辑输入
Diffchecker Desktop
运行Diffchecker最安全的方式。获取Diffchecker桌面应用:您的差异永远不会离开您的电脑!
获取桌面版
Diff
创建于
3年前
差异永不过期
清除
导出
分享
解释
22 删除
行
总计
删除
字符
总计
删除
要继续使用此功能,请升级到
Diff
checker
Pro
查看价格
96 行
全部复制
21 添加
行
总计
添加
字符
总计
添加
要继续使用此功能,请升级到
Diff
checker
Pro
查看价格
96 行
全部复制
import { writeFileSync } from "fs";
import { writeFileSync } from "fs";
import { codePartToCompactString } from "./utils/codePartToCompactString";
import { codePartToCompactString } from "./utils/codePartToCompactString";
import { getFlydeFiles } from "./utils/fs-helpers";
import { getFlydeFiles } from "./utils/fs-helpers";
import { preprocessStdLibParts } from "./utils/preprocessStdLibParts";
import { preprocessStdLibParts } from "./utils/preprocessStdLibParts";
import { join } from "path";
import { join } from "path";
import { chunkArray } from "./utils";
import { chunkArray } from "./utils";
import { readVersionResult } from "./utils/generatePartVersions";
import { readVersionResult } from "./utils/generatePartVersions";
复制
已复制
复制
已复制
import { fullChatInstructions } from "./benchmark/chat-completion-instructions";
(async function () {
(async function () {
const files = getFlydeFiles();
const files = getFlydeFiles();
const parts = preprocessStdLibParts(files);
const parts = preprocessStdLibParts(files);
const partsWithVersions = parts.map((part) => {
const partsWithVersions = parts.map((part) => {
const versionData = readVersionResult(part);
const versionData = readVersionResult(part);
return { ...part, ...versionData };
return { ...part, ...versionData };
});
});
const partsPerNamespace = partsWithVersions.reduce<
const partsPerNamespace = partsWithVersions.reduce<
Record<string, typeof parts>
Record<string, typeof parts>
>((acc, part) => {
>((acc, part) => {
const namespace = part.original.namespace ?? "n/a";
const namespace = part.original.namespace ?? "n/a";
if (!acc[namespace]) {
if (!acc[namespace]) {
acc[namespace] = [];
acc[namespace] = [];
}
}
acc[namespace].push(part);
acc[namespace].push(part);
return acc;
return acc;
}, {});
}, {});
const trainingIds = new Set<string>();
const trainingIds = new Set<string>();
const validationIds = new Set<string>();
const validationIds = new Set<string>();
Object.entries(partsPerNamespace).forEach(([k, parts]) => {
Object.entries(partsPerNamespace).forEach(([k, parts]) => {
const chunks = chunkArray(parts, 10);
const chunks = chunkArray(parts, 10);
chunks.forEach((chunk) => {
chunks.forEach((chunk) => {
chunk.forEach((part, idx) => {
chunk.forEach((part, idx) => {
if (idx === 0 && chunk.length > 4) {
if (idx === 0 && chunk.length > 4) {
validationIds.add(part.original.id);
validationIds.add(part.original.id);
} else {
} else {
trainingIds.add(part.original.id);
trainingIds.add(part.original.id);
}
}
});
});
});
});
});
});
const validationDataset = partsWithVersions.flatMap((part) => {
const validationDataset = partsWithVersions.flatMap((part) => {
if (!validationIds.has(part.original.id)) {
if (!validationIds.has(part.original.id)) {
return [];
return [];
}
}
复制
已复制
复制
已复制
const compactParts =
[
part.original.runFnString,
part.alternativeFunction]
const compactParts =
codePartToCompactString({
.map((code) => ({ ...part.original, runFnString: code }))
...part.original,
.map(codePartToCompactString)
;
runFnString:
part.original.runFnString,
})
;
return part.prompts.map((desc, idx) => {
return part.prompts.map((desc, idx) => {
return {
return {
prompt: desc + "\n\n###\n\n",
prompt: desc + "\n\n###\n\n",
completion: " " + compactParts[idx % 2] + "###",
completion: " " + compactParts[idx % 2] + "###",
};
};
});
});
});
});
const trainingDataset = partsWithVersions.flatMap((part) => {
const trainingDataset = partsWithVersions.flatMap((part) => {
if (!trainingIds.has(part.original.id)) {
if (!trainingIds.has(part.original.id)) {
return [];
return [];
}
}
复制
已复制
复制
已复制
const compactPart
s = [part.original.runFnString, part.alternativeFunction]
const compactPart
=
codePartToCompactString
(
{
.map((code) => ({ ...part.original, runFnString: code }))
...part.original
,
.map(
codePartToCompactString
);
runFnString: part.original.runFnString,
return part.prompts.map((desc, idx) => {
return
{
prompt: desc + "\n\n###\n\n"
,
completion: " " + compactParts[idx % 2] + "###",
};
});
});
复制
已复制
复制
已复制
const prompt = part.prompts[0];
return {
messages: [
{ role: "system", content: fullChatInstructions },
{ role: "user", content: prompt },
{ role: "assistant", content: compactPart },
],
};
});
});
复制
已复制
复制
已复制
console.log(
const datasetFileLocation = join(__dirname, `../dataset
-cc
.json`);
partsWithVersions.length,
trainingDataset.length,
validationDataset.length
);
const datasetFileLocation = join(__dirname, `../dataset
.json`);
writeFileSync(
writeFileSync(
datasetFileLocation,
datasetFileLocation,
JSON.stringify([...trainingDataset, ...validationDataset], null, 2)
JSON.stringify([...trainingDataset, ...validationDataset], null, 2)
);
);
console.log(
console.log(
复制
已复制
复制
已复制
`
Dataset
written to: ${datasetFileLocation}. Remember, the last ${validationDataset.length} entries are validation data.`
`
${trainingDataset.length} examples
written to: ${datasetFileLocation}. Remember, the last ${validationDataset.length} entries are validation data.`
);
);
})();
})();
已保存差异
原始文本
打开文件
import { writeFileSync } from "fs";
import { codePartToCompactString } from "./utils/codePartToCompactString";
import { getFlydeFiles } from "./utils/fs-helpers";
import { preprocessStdLibParts } from "./utils/preprocessStdLibParts";
import { join } from "path";
import { chunkArray } from "./utils";
import { readVersionResult } from "./utils/generatePartVersions";

/**
 * Generates `../dataset.json` (relative to this file): a JSON array of
 * `{ prompt, completion }` records, training records first and validation
 * records last.
 *
 * Steps:
 *  1. Load the parts and merge each one with its `readVersionResult` data.
 *  2. Group parts by `original.namespace` ("n/a" when it is null/undefined).
 *  3. Within each namespace, split into chunks via `chunkArray(parts, 10)`;
 *     the first part of every chunk longer than 4 goes to validation, every
 *     other part goes to training.
 *  4. Emit one record per prompt of each part, alternating between the
 *     original and the alternative function by prompt index.
 */
(async function () {
  const files = getFlydeFiles();
  const parts = preprocessStdLibParts(files);

  const partsWithVersions = parts.map((part) => ({
    ...part,
    ...readVersionResult(part),
  }));

  // Bucket the parts by namespace.
  const partsPerNamespace: Record<string, typeof parts> = {};
  for (const part of partsWithVersions) {
    const namespace = part.original.namespace ?? "n/a";
    if (!partsPerNamespace[namespace]) {
      partsPerNamespace[namespace] = [];
    }
    partsPerNamespace[namespace].push(part);
  }

  const trainingIds = new Set<string>();
  const validationIds = new Set<string>();

  for (const namespaceParts of Object.values(partsPerNamespace)) {
    chunkArray(namespaceParts, 10).forEach((chunk) => {
      // Only chunks with more than 4 parts give up their first part.
      const holdsOutFirst = chunk.length > 4;
      chunk.forEach((part, idx) => {
        const bucket = idx === 0 && holdsOutFirst ? validationIds : trainingIds;
        bucket.add(part.original.id);
      });
    });
  }

  // Turns one part into its prompt/completion records. Even prompt indexes
  // pair with the original function, odd ones with the alternative function.
  const toPromptCompletionPairs = (
    part: (typeof partsWithVersions)[number]
  ) => {
    const variants = [part.original.runFnString, part.alternativeFunction].map(
      (code) => ({ ...part.original, runFnString: code })
    );
    const compactParts = variants.map(codePartToCompactString);

    return part.prompts.map((desc, idx) => ({
      prompt: desc + "\n\n###\n\n",
      completion: " " + compactParts[idx % 2] + "###",
    }));
  };

  const validationDataset = partsWithVersions.flatMap((part) =>
    validationIds.has(part.original.id) ? toPromptCompletionPairs(part) : []
  );

  const trainingDataset = partsWithVersions.flatMap((part) =>
    trainingIds.has(part.original.id) ? toPromptCompletionPairs(part) : []
  );

  console.log(
    partsWithVersions.length,
    trainingDataset.length,
    validationDataset.length
  );

  const datasetFileLocation = join(__dirname, `../dataset.json`);
  const serialized = JSON.stringify(
    [...trainingDataset, ...validationDataset],
    null,
    2
  );
  writeFileSync(datasetFileLocation, serialized);

  console.log(
    `Dataset written to: ${datasetFileLocation}. Remember, the last ${validationDataset.length} entries are validation data.`
  );
})();
更改后文本
打开文件
import { writeFileSync } from "fs";
import { codePartToCompactString } from "./utils/codePartToCompactString";
import { getFlydeFiles } from "./utils/fs-helpers";
import { preprocessStdLibParts } from "./utils/preprocessStdLibParts";
import { join } from "path";
import { chunkArray } from "./utils";
import { readVersionResult } from "./utils/generatePartVersions";
import { fullChatInstructions } from "./benchmark/chat-completion-instructions";

/**
 * Generates `../dataset-cc.json` (relative to this file): a JSON array of
 * chat-style examples (`{ messages: [system, user, assistant] }`), training
 * examples first and validation examples last.
 *
 * Steps:
 *  1. Load the parts and merge each one with its `readVersionResult` data.
 *  2. Group parts by `original.namespace` ("n/a" when it is null/undefined).
 *  3. Within each namespace, split into chunks via `chunkArray(parts, 10)`;
 *     the first part of every chunk longer than 4 goes to validation, every
 *     other part goes to training.
 *  4. Emit one chat example per part, built from the part's first prompt.
 */
(async function () {
  const files = getFlydeFiles();
  const parts = preprocessStdLibParts(files);

  const partsWithVersions = parts.map((part) => {
    const versionData = readVersionResult(part);
    return { ...part, ...versionData };
  });

  const partsPerNamespace = partsWithVersions.reduce<
    Record<string, typeof parts>
  >((acc, part) => {
    const namespace = part.original.namespace ?? "n/a";
    if (!acc[namespace]) {
      acc[namespace] = [];
    }
    acc[namespace].push(part);
    return acc;
  }, {});

  const trainingIds = new Set<string>();
  const validationIds = new Set<string>();

  // The namespace key itself is not needed, only the grouped parts.
  Object.values(partsPerNamespace).forEach((namespaceParts) => {
    const chunks = chunkArray(namespaceParts, 10);
    chunks.forEach((chunk) => {
      chunk.forEach((part, idx) => {
        if (idx === 0 && chunk.length > 4) {
          validationIds.add(part.original.id);
        } else {
          trainingIds.add(part.original.id);
        }
      });
    });
  });

  // Builds the chat example for one part. Shared by both datasets so every
  // record in the output file has the same shape.
  // NOTE(review): assumes codePartToCompactString returns a string, since its
  // result is used directly as message content - confirm against the helper.
  const toChatExample = (part: (typeof partsWithVersions)[number]) => {
    const compactPart = codePartToCompactString({ ...part.original });
    const prompt = part.prompts[0];
    return {
      messages: [
        { role: "system", content: fullChatInstructions },
        { role: "user", content: prompt },
        { role: "assistant", content: compactPart },
      ],
    };
  };

  // Previously the validation records were still prompt/completion pairs that
  // did `compactParts[idx % 2]` on a single compact result, i.e. they picked
  // one character out of it instead of the whole code. They now use the same
  // chat format as the training records.
  const validationDataset = partsWithVersions
    .filter((part) => validationIds.has(part.original.id))
    .map(toChatExample);

  const trainingDataset = partsWithVersions
    .filter((part) => trainingIds.has(part.original.id))
    .map(toChatExample);

  const datasetFileLocation = join(__dirname, `../dataset-cc.json`);
  writeFileSync(
    datasetFileLocation,
    JSON.stringify([...trainingDataset, ...validationDataset], null, 2)
  );

  console.log(
    `${trainingDataset.length} examples written to: ${datasetFileLocation}. Remember, the last ${validationDataset.length} entries are validation data.`
  );
})();
查找差异