import * as url from "node:url";
import * as path from "node:path";
import * as fs from "node:fs/promises";
import { test, expect } from "@jest/globals";
import { CSVLoader } from "../fs/csv.js";
import { Document } from "../../document.js";
test("Test CSV loader from blob", async () => {
const filePath = path.resolve(
path.dirname(url.fileURLToPath(import.meta.url)),
"./example_data/Star_Wars_The_Clone_Wars_S06E07_Crisis_at_the_Heart.csv"
);
const loader = new CSVLoader(
new Blob([await fs.readFile(filePath)], { type: "text/csv" }),
"html"
);
const docs = await loader.load();
expect(docs.length).toBe(32);
expect(docs[0]).toEqual(
new Document({
metadata: { source: "blob", blobType: "text/csv", line: 1 },
pageContent:
"Corruption discovered at the core of the Banking Clan!",
})
);
expect(docs[1]).toEqual(
new Document({
metadata: { source: "blob", blobType: "text/csv", line: 2 },
pageContent: "Reunited, Rush Clovis and Senator Amidala",
})
);
});
test("Test CSV loader from blob", async () => {
const loader = new CSVLoader(
new Blob(
[
`id,text
1,This is a sentence.
2,This is another sentence.`,
],
{ type: "text/csv" }
)
);
const docs = await loader.load();
expect(docs.length).toBe(2);
expect(docs[0]).toMatchInlineSnapshot(`
Document {
"metadata": {
"blobType": "text/csv",
"line": 1,
"source": "blob",
},
"pageContent": "id: 1
text: This is a sentence.",
}
`);
expect(docs[1]).toMatchInlineSnapshot(`
Document {
"metadata": {
"blobType": "text/csv",
"line": 2,
"source": "blob",
},
"pageContent": "id: 2
text: This is another sentence.",
}
`);
});