// Mirror of https://github.com/Mintplex-Labs/anything-llm.git
// Synced 2024-11-19 12:40:09 +01:00
// 73 lines, 2.1 KiB, JavaScript
const MimeLib = require("mime");
|
|
const path = require("path");
|
|
/**
 * Resolves MIME types for file paths via the `mime` library, after forcing a
 * set of source-code extensions to resolve to `text/plain`.
 */
class MimeDetector {
  // Top-level MIME categories treated as non-text. Not referenced inside this
  // class — presumably consumed by callers; verify against call sites.
  nonTextTypes = ["multipart", "image", "model", "audio", "video"];

  // Full MIME types flagged as "bad". Not referenced inside this class —
  // presumably used by callers to reject such files; verify against call sites.
  badMimes = [
    "application/octet-stream",
    "application/zip",
    "application/pkcs8",
    "application/vnd.microsoft.portable-executable",
    "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet", // XLSX are binaries and need to be handled explicitly.
    "application/x-msdownload",
  ];

  // Lower-cased base names of files that the mime library does not detect and
  // that should be processed as text. Only add names of extension-less,
  // text-parsable files here; anything that has an extension belongs in the
  // override list inside setOverrides() instead.
  #specialTextFileTypes = ["dockerfile", "jenkinsfile"];

  /**
   * Binds the mime library to `this.lib` and applies the text overrides.
   */
  constructor() {
    // NOTE(review): this is the module-level mime object, not a private copy,
    // so the overrides below are applied to that same object — confirm that
    // sharing it with other consumers of the module is intended.
    this.lib = MimeLib;
    this.setOverrides();
  }

  /**
   * Forces a list of source-code extensions to map to `text/plain`.
   *
   * The `.ts` extension maps to `video/mp2t` by default because of the MPEG
   * transport stream format (https://en.wikipedia.org/wiki/MPEG_transport_stream),
   * which used this extension long before TypeScript existed, so the mapping
   * has to be re-defined explicitly. The second argument (`true`) asks the
   * library to replace any mapping that already exists for these extensions.
   *
   * @returns {void}
   */
  setOverrides() {
    this.lib.define(
      {
        "text/plain": [
          "ts",
          "tsx",
          "py",
          "opts",
          "lock",
          "jsonl",
          "qml",
          "sh",
          "c",
          "cs",
          "h",
          "js",
          "lua",
          "pas",
          "r",
          "go",
        ],
      },
      true
    );
  }

  /**
   * Returns the MIME type of the file.
   *
   * Resolution order:
   *  1. The type reported by the mime library (with the overrides applied).
   *  2. `text/plain` when the file's base name, compared case-insensitively,
   *     is one of the known extension-less text files (e.g. `Dockerfile`).
   *  3. `null` when neither of the above matches.
   *
   * @param {string} filepath
   * @returns {string|null} The MIME type, or `null` when it cannot be determined.
   */
  getType(filepath) {
    const parsedMime = this.lib.getType(filepath);
    if (parsedMime) return parsedMime;

    // path.basename() throws a TypeError for non-string input, so a missing or
    // malformed path is reported as "unknown" instead of crashing the caller.
    if (typeof filepath !== "string") return null;

    // If the mime could not be parsed, it could be a special file type like
    // Dockerfile or Jenkinsfile which we can reliably process as text.
    const baseName = path.basename(filepath).toLowerCase();
    return this.#specialTextFileTypes.includes(baseName) ? "text/plain" : null;
  }
}
|
|
|
|
// Public surface of this module: only the MimeDetector class is exported.
module.exports = { MimeDetector: MimeDetector };
|