All files / src/utils FileLoader.ts

97.43% Statements 38/39
85.29% Branches 29/34
100% Functions 1/1
97.36% Lines 37/38

Press n or j to go to the next uncovered block, b, p or k for the previous block.

1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152        81x                                                                       81x                                                       59x 13x 13x 12x   11x 11x 13x 13x 13x   13x 8x     3x 2x 2x                 1x 1x             2x       46x 6x     40x 40x   59x 24x 24x             16x 16x 16x   16x 7x     9x   2x 2x                 7x   3x       4x      
import { promises as fs } from "fs";
import * as path from "path";
import { ContentPart } from "../chat/Content.js";
 
/**
 * MIME type for each recognised file extension.
 *
 * Keys are lowercase and include the leading dot (for example ".png").
 * Extensions that are not listed have no entry, so a lookup yields `undefined`.
 */
const MIME_TYPES: Record<string, string> = Object.fromEntries<string>([
  // Images
  [".jpg", "image/jpeg"],
  [".jpeg", "image/jpeg"],
  [".png", "image/png"],
  [".gif", "image/gif"],
  [".webp", "image/webp"],
  // Video
  [".mp4", "video/mp4"],
  [".mpeg", "video/mpeg"],
  [".mov", "video/quicktime"],
  // Audio
  [".wav", "audio/wav"],
  [".mp3", "audio/mpeg"],
  // Source code, markup and other textual formats
  [".json", "application/json"],
  [".js", "text/javascript"],
  [".mjs", "text/javascript"],
  [".cjs", "text/javascript"],
  [".ts", "text/typescript"],
  [".rb", "text/x-ruby"],
  [".py", "text/x-python"],
  [".txt", "text/plain"],
  [".md", "text/markdown"],
  [".html", "text/html"],
  [".css", "text/css"],
  [".xml", "text/xml"],
  [".yml", "text/yaml"],
  [".yaml", "text/yaml"],
  [".csv", "text/csv"],
  [".go", "text/x-go"],
  [".java", "text/x-java"],
  [".c", "text/x-c"],
  [".cpp", "text/x-c++"],
  [".rs", "text/x-rust"],
  [".swift", "text/x-swift"],
  [".kt", "text/x-kotlin"],
  // Documents
  [".pdf", "application/pdf"]
]);
 
/**
 * File extensions (lowercase, with the leading dot) whose contents are read
 * as UTF-8 text and inlined, rather than base64-encoded as binary data.
 */
const TEXT_EXTENSIONS = new Set<string>([
  // Scripts and data interchange
  ".json", ".js", ".mjs", ".cjs", ".ts", ".rb", ".py",
  // Documents, markup and configuration
  ".txt", ".md", ".html", ".css", ".xml", ".yml", ".yaml", ".env", ".csv",
  // Compiled-language sources
  ".go", ".java", ".c", ".cpp", ".rs", ".swift", ".kt"
]);
 
/**
 * Turns a file reference (HTTP(S) URL, `data:` URI, or local path) into a
 * chat `ContentPart`.
 */
export class FileLoader {
  /**
   * Loads `filePath` and wraps it in the content part matching its media type.
   *
   * - `http://` / `https://` URLs (scheme matched case-insensitively) are
   *   downloaded and embedded as base64; the part type follows the response
   *   Content-Type. If the download fails for any reason, the URL itself is
   *   returned as an `image_url` part instead of throwing.
   * - `data:` URIs are passed through unchanged as an `image_url` part.
   * - Local paths whose extension is in `TEXT_EXTENSIONS` are read as UTF-8
   *   and returned as a `text` part framed by file-name markers.
   * - Any other local path is read as binary and base64-encoded; the part
   *   type follows the MIME type looked up in `MIME_TYPES`.
   *
   * @param filePath URL, data URI, or filesystem path of the file to load.
   * @returns The content part describing the file.
   * @throws Whatever `fs.readFile` rejects with when a local file cannot be read.
   */
  static async load(filePath: string): Promise<ContentPart> {
    // Require a real scheme separator: a bare "http" prefix would also match
    // local files such as "httpd.conf" or "http-notes.txt".
    if (/^https?:\/\//i.test(filePath)) {
      return FileLoader.loadRemote(filePath);
    }

    if (filePath.startsWith("data:")) {
      return { type: "image_url", image_url: { url: filePath } };
    }

    const ext = path.extname(filePath).toLowerCase();

    if (TEXT_EXTENSIONS.has(ext)) {
      const content = await fs.readFile(filePath, "utf-8");
      return {
        type: "text",
        text: `\n\n--- File: ${path.basename(filePath)} ---\n${content}\n--- End of File ---\n`
      };
    }

    // Binary files (images, video, audio, and anything unrecognised).
    const mime = MIME_TYPES[ext] ?? "application/octet-stream";
    const data = await fs.readFile(filePath);
    return FileLoader.toMediaPart(mime, data.toString("base64"));
  }

  /** Downloads `url` and embeds the body as base64; falls back to the bare URL on any failure. */
  private static async loadRemote(url: string): Promise<ContentPart> {
    try {
      const response = await fetch(url);
      if (!response.ok) throw new Error(`Failed to fetch file: ${response.statusText}`);

      const buffer = await response.arrayBuffer();
      const header = response.headers.get("content-type") ?? "";
      // Drop parameters such as "; charset=utf-8". Media types are
      // case-insensitive, so normalise before comparing prefixes. `||` is
      // deliberate: a missing or empty type falls back to image/jpeg.
      const contentType = header.split(";")[0]?.trim().toLowerCase() || "image/jpeg";

      return FileLoader.toMediaPart(contentType, Buffer.from(buffer).toString("base64"));
    } catch {
      // Best effort: hand the URL through as-is when it cannot be downloaded.
      return { type: "image_url", image_url: { url } };
    }
  }

  /** Wraps base64-encoded bytes in the content part that corresponds to `mime`. */
  private static toMediaPart(mime: string, base64: string): ContentPart {
    const dataUri = `data:${mime};base64,${base64}`;

    if (mime.startsWith("audio/")) {
      // The audio part carries a short format name rather than a full MIME
      // type, so "audio/mpeg" is reported as "mp3".
      const format = mime.split("/")[1];
      return {
        type: "input_audio",
        input_audio: {
          data: base64,
          format: (format === "mpeg" ? "mp3" : format) ?? "wav"
        }
      };
    }

    if (mime.startsWith("video/")) {
      // Video is passed as a data URI; some providers may not accept that.
      return { type: "video_url", video_url: { url: dataUri } };
    }

    // Images, plus the fallback for every other/unknown binary type.
    return { type: "image_url", image_url: { url: dataUri } };
  }
}