diff --git a/.fernignore b/.fernignore
index 19625584..7f3bf4cb 100644
--- a/.fernignore
+++ b/.fernignore
@@ -10,11 +10,15 @@ src/humanloop.client.ts
 src/overload.ts
 src/error.ts
 src/context.ts
+src/cli.ts
+src/cache
+src/sync 
 
 # Tests
 
 # Modified due to issues with OTEL
 tests/unit/fetcher/stream-wrappers/webpack.test.ts
+tests/custom/
 
 # CI Action
 
diff --git a/README.md b/README.md
index e1765775..6ac9ea37 100644
--- a/README.md
+++ b/README.md
@@ -91,6 +91,47 @@ try {
 }
 ```
 
+## Store Humanloop Files in Code
+
+Humanloop allows you to maintain Prompts and Agents in your local filesystem and version control, while still leveraging Humanloop's prompt management capabilities.
+
+### Syncing Files with the CLI
+
+```bash
+# Basic usage
+npx humanloop pull                               # Pull all files to 'humanloop/' directory
+npx humanloop pull --path="examples/chat"        # Pull specific directory
+npx humanloop pull --environment="production"    # Pull from specific environment
+npx humanloop pull --local-files-directory="ai"  # Specify local destination (default: "humanloop")
+
+# View available options
+npx humanloop pull --help
+```
+
+### Using Local Files in the SDK
+
+To use local Files in your code:
+
+```typescript
+// Enable local file support
+const client = new HumanloopClient({
+  apiKey: "YOUR_API_KEY",
+  useLocalFiles: true
+});
+
+// Call a local Prompt file
+const response = await client.prompts.call({
+  path: "examples/chat/basic",  // Looks for humanloop/examples/chat/basic.prompt
+  inputs: { query: "Hello world" }
+});
+
+// The same path-based approach works with prompts.log(), agents.call(), and agents.log()
+```
+
+For detailed instructions, see our [Guide on Storing Files in Code](https://humanloop.com/docs/v5/guides/prompts/store-prompts-in-code).
+
+For information about file formats, see our [File Format Reference](https://humanloop.com/docs/v5/reference/serialized-files).
+
 ## Pagination
 
 List endpoints are paginated. The SDK provides an iterator so that you can simply loop over the items:
diff --git a/jest.config.mjs b/jest.config.mjs
index c7248211..b4a8227b 100644
--- a/jest.config.mjs
+++ b/jest.config.mjs
@@ -3,6 +3,11 @@ export default {
     preset: "ts-jest",
     testEnvironment: "node",
     moduleNameMapper: {
-        "(.+)\.js$": "$1",
+        // Only map .js files in our src directory, not node_modules
+        "^src/(.+)\\.js$": "<rootDir>/src/$1",
     },
+    // Add transformIgnorePatterns to handle ESM modules in node_modules
+    transformIgnorePatterns: [
+        "node_modules/(?!(@traceloop|js-tiktoken|base64-js)/)",
+    ],
 };
diff --git a/package.json b/package.json
index ed2af786..0374d4f0 100644
--- a/package.json
+++ b/package.json
@@ -27,6 +27,8 @@
         "@traceloop/instrumentation-openai": ">=0.11.3",
         "@traceloop/ai-semantic-conventions": ">=0.11.6",
         "cli-progress": "^3.12.0",
+        "dotenv": "^16.5.0",
+        "commander": "^14.0.0",
         "lodash": "^4.17.21"
     },
     "devDependencies": {
@@ -46,7 +48,6 @@
         "openai": "^4.74.0",
         "@anthropic-ai/sdk": "^0.32.1",
         "cohere-ai": "^7.15.0",
-        "dotenv": "^16.4.6",
         "jsonschema": "^1.4.1",
         "@types/cli-progress": "^3.11.6",
         "@types/lodash": "4.14.74",
diff --git a/src/cache/LRUCache.ts b/src/cache/LRUCache.ts
new file mode 100644
index 00000000..30d0877b
--- /dev/null
+++ b/src/cache/LRUCache.ts
@@ -0,0 +1,48 @@
+/**
+ * LRU Cache implementation
+ */
+export default class LRUCache<K, V> {
+    private cache: Map<K, V>;
+    private readonly maxSize: number;
+
+    constructor(maxSize: number) {
+        this.cache = new Map<K, V>();
+        this.maxSize = maxSize;
+    }
+
+    get(key: K): V | undefined {
+        if (!this.cache.has(key)) {
+            return undefined;
+        }
+
+        // Get the value
+        const value = this.cache.get(key);
+
+        // Remove key and re-insert to mark as most recently used
+        this.cache.delete(key);
+        this.cache.set(key, value!);
+
+        return value;
+    }
+
+    set(key: K, value: V): void {
+        // If key already exists, refresh its position
+        if (this.cache.has(key)) {
+            this.cache.delete(key);
+        }
+        // If cache is full, remove the least recently used item (first item in the map)
+        else if (this.cache.size >= this.maxSize) {
+            const lruKey = this.cache.keys().next().value;
+            if (lruKey) {
+                this.cache.delete(lruKey);
+            }
+        }
+
+        // Add new key-value pair
+        this.cache.set(key, value);
+    }
+
+    clear(): void {
+        this.cache.clear();
+    }
+}
diff --git a/src/cache/index.ts b/src/cache/index.ts
new file mode 100644
index 00000000..d440ec99
--- /dev/null
+++ b/src/cache/index.ts
@@ -0,0 +1 @@
+export { default as LRUCache } from './LRUCache';
\ No newline at end of file
diff --git a/src/cli.ts b/src/cli.ts
new file mode 100644
index 00000000..6df8d05a
--- /dev/null
+++ b/src/cli.ts
@@ -0,0 +1,183 @@
+#!/usr/bin/env node
+import * as dotenv from "dotenv";
+import { Command } from "commander";
+import path from "path";
+
+import { HumanloopClient } from "./humanloop.client";
+import FileSyncer from "./sync/FileSyncer";
+import { SDK_VERSION } from "./version";
+
+dotenv.config();
+
+const LogType = {
+    SUCCESS: "\x1b[92m", // green
+    ERROR: "\x1b[91m", // red
+    INFO: "\x1b[96m", // cyan
+    WARN: "\x1b[93m", // yellow
+    RESET: "\x1b[0m",
+} as const;
+
+function log(message: string, type: keyof typeof LogType): void {
+    console.log(`${LogType[type]}${message}${LogType.RESET}`);
+}
+
+const program = new Command();
+program
+    .name("humanloop")
+    .description("Humanloop CLI for managing sync operations")
+    .version(SDK_VERSION);
+
+interface CommonOptions {
+    apiKey?: string;
+    envFile?: string;
+    baseUrl?: string;
+    localFilesDirectory?: string;
+}
+
+interface PullOptions extends CommonOptions {
+    path?: string;
+    environment?: string;
+    verbose?: boolean;
+    quiet?: boolean;
+}
+
+const addCommonOptions = (command: Command) =>
+    command
+        .option("--api-key <apiKey>", "Humanloop API key")
+        .option("--env-file <envFile>", "Path to .env file")
+        .option("--base-url <baseUrl>", "Base URL for Humanloop API")
+        .option(
+            "--local-dir, --local-files-directory <dir>",
+            "Directory where Humanloop files are stored locally (default: humanloop/)",
+            "humanloop",
+        );
+
+// Instantiate a HumanloopClient for the CLI
+function getClient(options: CommonOptions): HumanloopClient {
+    if (options.envFile) {
+        const result = dotenv.config({ path: options.envFile });
+        if (result.error) {
+            log(
+                `Failed to load environment file: ${options.envFile} (file not found or invalid format)`,
+                "ERROR",
+            );
+            process.exit(1);
+        }
+    }
+
+    const apiKey = options.apiKey || process.env.HUMANLOOP_API_KEY;
+    if (!apiKey) {
+        log(
+            "No API key found. Set HUMANLOOP_API_KEY in .env file or environment, or use --api-key",
+            "ERROR",
+        );
+        process.exit(1);
+    }
+
+    return new HumanloopClient({
+        apiKey,
+        baseUrl: options.baseUrl,
+        localFilesDirectory: options.localFilesDirectory,
+    });
+}
+
+// Helper to handle sync errors
+function handleSyncErrors<T extends CommonOptions>(fn: (options: T) => Promise<void>) {
+    return async (options: T) => {
+        try {
+            await fn(options);
+        } catch (error) {
+            log(`Error: ${error}`, "ERROR");
+            process.exit(1);
+        }
+    };
+}
+
+// Pull command
+addCommonOptions(
+    program
+        .command("pull")
+        .description(
+            "Pull Prompt and Agent files from Humanloop to your local filesystem.\n\n" +
+                "This command will:\n" +
+                "1. Fetch Prompt and Agent files from your Humanloop workspace\n" +
+                "2. Save them to your local filesystem (directory specified by --local-files-directory, default: humanloop/)\n" +
+                "3. Maintain the same directory structure as in Humanloop\n" +
+                "4. Add appropriate file extensions (.prompt or .agent)\n\n" +
+                "For example, with the default --local-files-directory=humanloop, files will be saved as:\n" +
+                "./humanloop/\n" +
+                "├── my_project/\n" +
+                "│   ├── prompts/\n" +
+                "│   │   ├── my_prompt.prompt\n" +
+                "│   │   └── nested/\n" +
+                "│   │       └── another_prompt.prompt\n" +
+                "│   └── agents/\n" +
+                "│       └── my_agent.agent\n" +
+                "└── another_project/\n" +
+                "    └── prompts/\n" +
+                "        └── other_prompt.prompt\n\n" +
+                "If you specify --local-files-directory=data/humanloop, files will be saved in ./data/humanloop/ instead.\n\n" +
+                "If a file exists both locally and in the Humanloop workspace, the local file will be overwritten\n" +
+                "with the version from Humanloop. Files that only exist locally will not be affected.\n\n" +
+                "Currently only supports syncing Prompt and Agent files. Other file types will be skipped.",
+        )
+        .option(
+            "-p, --path <path>",
+            "Path in the Humanloop workspace to pull from (file or directory). " +
+                "You can pull an entire directory (e.g. 'my/directory') or a specific file (e.g. 'my/directory/my_prompt.prompt'). " +
+                "When pulling a directory, all files within that directory and its subdirectories will be included. " +
+                "Paths should not contain leading or trailing slashes. " +
+                "If not specified, pulls from the root of the remote workspace.",
+        )
+        .option(
+            "-e, --environment <env>",
+            "Environment to pull from (e.g. 'production', 'staging')",
+        )
+        .option("-v, --verbose", "Show detailed information about the operation")
+        .option("-q, --quiet", "Suppress output of successful files"),
+).action(
+    handleSyncErrors(async (options: PullOptions) => {
+        const client = getClient(options);
+
+        // Create a separate FileSyncer instance with log level based on verbose flag only
+        const fileSyncer = new FileSyncer(client, {
+            baseDir: options.localFilesDirectory,
+            verbose: options.verbose,
+        });
+
+        log("Pulling files from Humanloop...", "INFO");
+        log(`Path: ${options.path || "(root)"}`, "INFO");
+        log(`Environment: ${options.environment || "(default)"}`, "INFO");
+
+        const startTime = Date.now();
+        const [successfulFiles, failedFiles] = await fileSyncer.pull(
+            options.path,
+            options.environment,
+        );
+        const duration = Date.now() - startTime;
+
+        // Always show operation result
+        const isSuccessful = failedFiles.length === 0;
+        log(`Pull completed in ${duration}ms`, isSuccessful ? "SUCCESS" : "ERROR");
+
+        // Only suppress successful files output if quiet flag is set
+        if (successfulFiles.length > 0 && !options.quiet) {
+            console.log(); // Empty line
+            log(`Successfully pulled ${successfulFiles.length} files:`, "SUCCESS");
+            for (const file of successfulFiles) {
+                log(`  ✓ ${file}`, "SUCCESS");
+            }
+        }
+
+        // Always show failed files
+        if (failedFiles.length > 0) {
+            console.log(); // Empty line
+            log(`Failed to pull ${failedFiles.length} files:`, "ERROR");
+            for (const file of failedFiles) {
+                log(`  ✗ ${file}`, "ERROR");
+            }
+        }
+    }),
+);
+
+program.parse(process.argv);
diff --git a/src/humanloop.client.ts b/src/humanloop.client.ts
index ac7cb197..998632a2 100644
--- a/src/humanloop.client.ts
+++ b/src/humanloop.client.ts
@@ -8,10 +8,6 @@ import { OpenAIInstrumentation } from "@traceloop/instrumentation-openai";
 import { HumanloopClient as BaseHumanloopClient } from "./Client";
 import { ChatMessage } from "./api";
 import { Evaluations as BaseEvaluations } from "./api/resources/evaluations/client/Client";
-import { Evaluators } from "./api/resources/evaluators/client/Client";
-import { Flows } from "./api/resources/flows/client/Client";
-import { Prompts } from "./api/resources/prompts/client/Client";
-import { Tools } from "./api/resources/tools/client/Client";
 import { ToolKernelRequest } from "./api/types/ToolKernelRequest";
 import { flowUtilityFactory } from "./decorators/flow";
 import { promptDecoratorFactory } from "./decorators/prompt";
@@ -28,7 +24,8 @@ import {
 } from "./evals/types";
 import { HumanloopSpanExporter } from "./otel/exporter";
 import { HumanloopSpanProcessor } from "./otel/processor";
-import { overloadCall, overloadLog } from "./overload";
+import { overloadClient } from "./overload";
+import { FileSyncer } from "./sync";
 import { SDK_VERSION } from "./version";
 
 const RED = "\x1b[91m";
@@ -199,17 +196,48 @@ class HumanloopTracerSingleton {
     }
 }
 
+export interface HumanloopClientOptions extends BaseHumanloopClient.Options {
+    /**
+     * Whether to use local files for prompts and agents
+     */
+    useLocalFiles?: boolean;
+
+    /**
+     * Base directory where local prompt and agent files are stored (default: "humanloop").
+     * This is relative to the current working directory. For example:
+     * - "humanloop" will look for files in "./humanloop/"
+     * - "data/humanloop" will look for files in "./data/humanloop/"
+     * When using paths in the API, they must be relative to this directory. For example,
+     * if localFilesDirectory="humanloop" and you have a file at "humanloop/samples/test.prompt",
+     * you would reference it as "samples/test" in your code.
+     */
+    localFilesDirectory?: string;
+
+    /**
+     * Maximum number of files to cache when useLocalFiles is true (default: DEFAULT_CACHE_SIZE).
+     * This parameter has no effect if useLocalFiles is false.
+     */
+    cacheSize?: number;
+
+    /**
+     * LLM provider modules to instrument. Allows the prompt decorator to spy on provider calls and log them to Humanloop
+     */
+    instrumentProviders?: {
+        OpenAI?: any;
+        Anthropic?: any;
+        CohereAI?: any;
+    };
+}
+
 export class HumanloopClient extends BaseHumanloopClient {
     protected readonly _evaluations: ExtendedEvaluations;
-    protected readonly _prompts_overloaded: Prompts;
-    protected readonly _flows_overloaded: Flows;
-    protected readonly _tools_overloaded: Tools;
-    protected readonly _evaluators_overloaded: Evaluators;
     protected readonly instrumentProviders: {
         OpenAI?: any;
         Anthropic?: any;
         CohereAI?: any;
     };
+    protected readonly _fileSyncer: FileSyncer;
+    protected readonly useLocalFiles: boolean;
 
     protected get opentelemetryTracer(): Tracer {
         return HumanloopTracerSingleton.getInstance({
@@ -243,29 +271,32 @@ export class HumanloopClient extends BaseHumanloopClient {
      * const anthropic = new Anthropic({apiKey: process.env.ANTHROPIC_KEY});
      * ```
      */
-    constructor(
-        _options: BaseHumanloopClient.Options & {
-            instrumentProviders?: {
-                OpenAI?: any;
-                Anthropic?: any;
-                CohereAI?: any;
-            };
-        },
-    ) {
-        super(_options);
+    constructor(options: HumanloopClientOptions = {}) {
+        super(options);
 
-        this.instrumentProviders = _options.instrumentProviders || {};
+        this.useLocalFiles = options.useLocalFiles || false;
 
-        this._prompts_overloaded = overloadLog(super.prompts);
-        this._prompts_overloaded = overloadCall(this._prompts_overloaded);
+        // Warn user if cacheSize is non-default but useLocalFiles is false
+        if (!this.useLocalFiles && options.cacheSize !== undefined) {
+            console.warn(
+                `The specified cacheSize=${options.cacheSize} will have no effect because useLocalFiles=false. ` +
+                    `File caching is only active when local files are enabled.`,
+            );
+        }
 
-        this._tools_overloaded = overloadLog(super.tools);
+        this._fileSyncer = new FileSyncer(this, {
+            baseDir: options.localFilesDirectory || "humanloop",
+            cacheSize: options.cacheSize,
+        });
 
-        this._flows_overloaded = overloadLog(super.flows);
+        this.instrumentProviders = options.instrumentProviders || {};
 
-        this._evaluators_overloaded = overloadLog(super.evaluators);
+        overloadClient(super.prompts, this._fileSyncer, this.useLocalFiles);
+        overloadClient(super.flows, this._fileSyncer, this.useLocalFiles);
+        overloadClient(super.tools, this._fileSyncer, this.useLocalFiles);
+        overloadClient(super.evaluators, this._fileSyncer, this.useLocalFiles);
 
-        this._evaluations = new ExtendedEvaluations(_options, this);
+        this._evaluations = new ExtendedEvaluations(options, this);
 
         // Initialize the tracer singleton
         HumanloopTracerSingleton.getInstance({
@@ -359,14 +390,14 @@ ${RESET}`,
      *       temperature: 0.5,
      *     });
      *     const openaiContent = openaiResponse.choices[0].message.content;
-     *
+    
      *     const anthropicClient = new Anthropic({ apiKey: process.env.ANTHROPIC_API_KEY });
      *     const anthropicResponse = await anthropicClient.messages.create({
      *       model: "claude-3-5-sonnet-20240620",
      *       temperature: 0.5,
      *     });
      *     const anthropicContent = anthropicResponse.content;
-     *
+    
      *     return { openaiContent, anthropicContent };
      *   }
      * });
@@ -560,23 +591,59 @@ ${RESET}`,
         );
     }
 
-    public get evaluations(): ExtendedEvaluations {
-        return this._evaluations;
-    }
-
-    public get prompts(): Prompts {
-        return this._prompts_overloaded;
-    }
-
-    public get flows(): Flows {
-        return this._flows_overloaded;
-    }
-
-    public get tools(): Tools {
-        return this._tools_overloaded;
+    /**
+     * Pull Prompt and Agent files from Humanloop to local filesystem.
+     *
+     * This method will:
+     * 1. Fetch Prompt and Agent files from your Humanloop workspace
+     * 2. Save them to your local filesystem (directory specified by `localFilesDirectory`, default: "humanloop")
+     * 3. Maintain the same directory structure as in Humanloop
+     * 4. Add appropriate file extensions (`.prompt` or `.agent`)
+     *
+     * The path parameter can be used in two ways:
+     * - If it points to a specific file (e.g. "path/to/file.prompt" or "path/to/file.agent"), only that file will be pulled
+     * - If it points to a directory (e.g. "path/to/directory"), all Prompt and Agent files in that directory and its subdirectories will be pulled
+     * - If no path is provided, all Prompt and Agent files will be pulled
+     *
+     * The operation will overwrite existing files with the latest version from Humanloop
+     * but will not delete local files that don't exist in the remote workspace.
+     *
+     * Currently only supports syncing Prompt and Agent files. Other file types will be skipped.
+     *
+     * For example, with the default `localFilesDirectory="humanloop"`, files will be saved as:
+     * ```
+     * ./humanloop/
+     * ├── my_project/
+     * │   ├── prompts/
+     * │   │   ├── my_prompt.prompt
+     * │   │   └── nested/
+     * │   │       └── another_prompt.prompt
+     * │   └── agents/
+     * │       └── my_agent.agent
+     * └── another_project/
+     *     └── prompts/
+     *         └── other_prompt.prompt
+     * ```
+     *
+     * If you specify `localFilesDirectory="data/humanloop"`, files will be saved in ./data/humanloop/ instead.
+     *
+     * @param path - Optional path to either a specific file (e.g. "path/to/file.prompt") or a directory (e.g. "path/to/directory").
+     *              If not provided, all Prompt and Agent files will be pulled.
+     * @param environment - The environment to pull the files from.
+     * @returns An array containing two string arrays:
+     *          - First array contains paths of successfully synced files
+     *          - Second array contains paths of files that failed to sync (due to API errors, missing content,
+     *            or filesystem issues)
+     * @throws HumanloopRuntimeError If there's an error communicating with the API
+     */
+    public async pull(
+        path?: string,
+        environment?: string,
+    ): Promise<[string[], string[]]> {
+        return this._fileSyncer.pull(path, environment);
     }
 
-    public get evaluators(): Evaluators {
-        return this._evaluators_overloaded;
+    public get evaluations(): ExtendedEvaluations {
+        return this._evaluations;
     }
 }
diff --git a/src/overload.ts b/src/overload.ts
index dd66643a..5dff103b 100644
--- a/src/overload.ts
+++ b/src/overload.ts
@@ -1,44 +1,73 @@
+import path from "path";
+
 import {
     CreateEvaluatorLogRequest,
+    FileType,
     FlowLogRequest,
-    PromptCallResponse,
     PromptLogRequest,
     ToolLogRequest,
 } from "./api";
+import { Agents } from "./api/resources/agents/client/Client";
+import { Datasets } from "./api/resources/datasets/client/Client";
 import { Evaluators } from "./api/resources/evaluators/client/Client";
 import { Flows } from "./api/resources/flows/client/Client";
 import { Prompts } from "./api/resources/prompts/client/Client";
 import { Tools } from "./api/resources/tools/client/Client";
 import { getDecoratorContext, getEvaluationContext, getTraceId } from "./context";
 import { HumanloopRuntimeError } from "./error";
+import FileSyncer, {
+    SERIALIZABLE_FILE_TYPES,
+    SerializableFileType,
+} from "./sync/FileSyncer";
 
-export function overloadLog<T extends Flows | Prompts | Tools | Evaluators>(
-    client: T,
+type ClientType = Flows | Agents | Prompts | Tools | Evaluators | Datasets;
+type LogRequestType =
+    | FlowLogRequest
+    | PromptLogRequest
+    | ToolLogRequest
+    | CreateEvaluatorLogRequest;
+
+/**
+ * Get the file type based on the client type.
+ * 
+ * @param client Client instance to check
+ * @returns The file type corresponding to the client, or null if not a file type that supports local files
+ */
+function getFileTypeFromClient(client: ClientType): SerializableFileType | null {
+    if (client instanceof Prompts) {
+        return "prompt";
+    } else if (client instanceof Agents) {
+        return "agent";
+    } else if (client instanceof Tools) {
+        return null; // Tools don't support local files
+    } else if (client instanceof Flows) {
+        return null; // Flows don't support local files
+    } else if (client instanceof Evaluators) {
+        return null; // Evaluators don't support local files
+    } else if (client instanceof Datasets) {
+        return null; // Datasets don't support local files
+    } else {
+        throw new HumanloopRuntimeError(
+            // @ts-ignore Client shouldn't be of a type other than those checked above, but included as a safeguard
+            `Unsupported client type: ${client.constructor.name}`,
+        );
+    }
+}
+
+/**
+ * Handle tracing context for both log and call methods.
+ * 
+ * @param request The API request
+ * @param client The client making the request
+ * @returns The updated request with tracing context applied
+ */
+function handleTracingContext<T extends LogRequestType>(
+    request: T,
+    client: ClientType,
 ): T {
-    const originalLog = client.log.bind(client);
-
-    const _overloadedLog = async (
-        request: T extends Flows
-            ? FlowLogRequest
-            : T extends Prompts
-              ? PromptLogRequest
-              : T extends Tools
-                ? ToolLogRequest
-                : T extends Evaluators
-                  ? CreateEvaluatorLogRequest
-                  : never,
-        options?: T extends Flows
-            ? Flows.RequestOptions
-            : T extends Prompts
-              ? Prompts.RequestOptions
-              : T extends Tools
-                ? Tools.RequestOptions
-                : T extends Evaluators
-                  ? Evaluators.RequestOptions
-                  : never,
-    ) => {
-        const traceId = getTraceId();
-        if (traceId !== undefined && client instanceof Flows) {
+    const traceId = getTraceId();
+    if (traceId !== undefined) {
+        if (client instanceof Flows) {
             const context = getDecoratorContext();
             if (context === undefined) {
                 throw new HumanloopRuntimeError(
@@ -46,85 +75,291 @@ export function overloadLog<T extends Flows | Prompts | Tools | Evaluators>(
                 );
             }
             throw new HumanloopRuntimeError(
-                `Using flows.log() is not allowed: Flow decorator for File ${context.path} manages the tracing and trace completion.`,
+                `Using \`flows.log()\` is not allowed: Flow decorator ` +
+                `for File ${context.path} manages the tracing and trace completion.`,
             );
         }
 
-        if (traceId !== undefined) {
-            if ("traceParentId" in request) {
-                console.warn(
-                    "Ignoring trace_parent_id argument: the Flow decorator manages tracing.",
+        if ("traceParentId" in request) {
+            console.warn(
+                "Ignoring trace_parent_id argument: the Flow decorator manages tracing.",
+            );
+        }
+        return {
+            ...request,
+            traceParentId: traceId,
+        };
+    }
+    return request;
+}
+
+/**
+ * Load prompt/agent file content from local filesystem into API request.
+ *
+ * Retrieves the file content at the specified path and adds it to request
+ * under the appropriate field ('prompt' or 'agent'), allowing local files
+ * to be used in API calls instead of fetching from Humanloop API.
+ *
+ * @param request API request object
+ * @param client Client instance making the call
+ * @param fileSyncer FileSyncer handling local file operations
+ * @returns Updated request with file content in the appropriate field
+ * @throws HumanloopRuntimeError On validation or file loading failures.
+ *   For example, an invalid path format (absolute paths, leading/trailing slashes, etc.) 
+ *   or a file not being found.
+ */
+function handleLocalFiles<T extends LogRequestType>(
+    request: T,
+    client: ClientType,
+    fileSyncer: FileSyncer,
+): T {
+    // Validate request has either id or path, but not both
+    if ("id" in request && "path" in request) {
+        throw new HumanloopRuntimeError("Can only specify one of `id` or `path`");
+    }
+    if (!("id" in request) && !("path" in request)) {
+        throw new HumanloopRuntimeError("Must specify either `id` or `path`");
+    }
+
+    // If using id, we can't use local files
+    if ("id" in request) {
+        return request;
+    }
+
+    const filePath = request.path?.trim();
+    if (!filePath) {
+        throw new HumanloopRuntimeError("Path cannot be empty");
+    }
+
+    // First check for path format issues (absolute paths or leading/trailing slashes)
+    const normalizedPath = filePath.trim().replace(/^\/+|\/+$/g, "");
+    if (path.isAbsolute(filePath) || filePath !== normalizedPath) {
+        throw new HumanloopRuntimeError(
+            `Path '${filePath}' format is invalid. ` +
+            `Paths must follow the standard API format 'path/to/resource' without leading or trailing slashes. ` +
+            `Please use '${normalizedPath}' instead.`,
+        );
+    }
+
+    // Then check for file extensions
+    if (fileSyncer.isFile(filePath)) {
+        const pathWithoutExtension = path.join(
+            path.dirname(filePath),
+            path.basename(filePath, path.extname(filePath)),
+        );
+        throw new HumanloopRuntimeError(
+            `Path '${filePath}' should not include any file extensions in API calls. ` +
+            `When referencing files via the \`path\` parameter, use the path without extensions: '${pathWithoutExtension}'. ` +
+            `Note: File extensions are only used when pulling specific files via the CLI.`,
+        );
+    }
+
+    // Check if version_id or environment is specified
+    const useRemote = "versionId" in request || "environment" in request;
+    if (useRemote) {
+        throw new HumanloopRuntimeError(
+            `Cannot use local file for \`${filePath}\` as version_id or environment was specified. ` +
+            `Please either remove version_id/environment to use local files, or set use_local_files=False to use remote files.`,
+        );
+    }
+
+    const fileType = getFileTypeFromClient(client);
+    if (!fileType || !SERIALIZABLE_FILE_TYPES.has(fileType)) {
+        throw new HumanloopRuntimeError(
+            `Local files are not supported for \`${fileType?.charAt(0).toUpperCase()}${fileType?.slice(1)}\` files: '${filePath}'.`,
+        );
+    }
+
+    // If file_type is already specified in request, prioritize user-provided value
+    if (fileType in request && typeof request[fileType as keyof T] !== "string") {
+        console.warn(
+            `Ignoring local file for \`${filePath}\` as ${fileType} parameters were directly provided. ` +
+            `Using provided parameters instead.`,
+        );
+        return request;
+    }
+
+    try {
+        const fileContent = fileSyncer.getFileContent(filePath, fileType);
+        return {
+            ...request,
+            [fileType]: fileContent,
+        } as T;
+    } catch (error) {
+        throw new HumanloopRuntimeError(
+            `Failed to use local file for \`${filePath}\`: ${error}`,
+        );
+    }
+}
+
+/**
+ * Handle evaluation context for logging.
+ * 
+ * @param request The API request
+ * @returns Tuple of [updated request, callback function]
+ */
+function handleEvaluationContext<T extends LogRequestType>(
+    request: T,
+): [T, ((id: string) => Promise<void>) | null] {
+    const evaluationContext = getEvaluationContext();
+    if (evaluationContext !== undefined) {
+        const [newRequest, callback] = evaluationContext.logArgsWithContext({
+            logArgs: request,
+            forOtel: true,
+            path: request.path,
+        });
+        return [newRequest as T, callback];
+    }
+    return [request, null];
+}
+
+/**
+ * Overloaded log method implementation.
+ * Handles tracing context, local file loading, and evaluation context.
+ * 
+ * @param self The client instance
+ * @param fileSyncer Optional FileSyncer for local file operations
+ * @param useLocalFiles Whether to use local files
+ * @param request The log request
+ * @param options Additional options
+ * @returns The log response
+ */
+async function overloadedLog<T extends ClientType>(
+    self: T,
+    fileSyncer: FileSyncer | undefined,
+    useLocalFiles: boolean,
+    request: LogRequestType,
+    options?: any,
+) {
+    try {
+        // Special handling for flows - prevent direct log usage
+        if (self instanceof Flows && getTraceId() !== undefined) {
+            const context = getDecoratorContext();
+            if (context === undefined) {
+                throw new HumanloopRuntimeError(
+                    "Internal error: trace_id context is set outside a decorator context.",
                 );
             }
-            request = {
-                ...request,
-                traceParentId: traceId,
-            };
+            throw new HumanloopRuntimeError(
+                `Using \`flows.log()\` is not allowed: Flow decorator ` +
+                `for File ${context.path} manages the tracing and trace completion.`,
+            );
         }
 
-        const evaluationContext = getEvaluationContext();
-        if (evaluationContext !== undefined) {
-            const [kwargsEval, evalCallback] = evaluationContext.logArgsWithContext({
-                logArgs: request,
-                forOtel: true,
-                path: request.path,
-            });
-            try {
-                // @ts-ignore Polymorphism alarms the type checker
-                const response = await originalLog(kwargsEval, options);
-                if (evalCallback !== null) {
-                    await evalCallback(response.id);
-                }
-                return response;
-            } catch (e) {
-                throw new HumanloopRuntimeError(String(e));
-            }
-        } else {
-            try {
-                // @ts-ignore Polymorphism alarms the type checker
-                return await originalLog(request, options);
-            } catch (e) {
-                throw new HumanloopRuntimeError(String(e));
+        request = handleTracingContext(request, self);
+
+        // Handle loading files from local filesystem when using Prompt and Agent clients
+        if (
+            useLocalFiles &&
+            (self instanceof Prompts || self instanceof Agents)
+        ) {
+            if (!fileSyncer) {
+                throw new HumanloopRuntimeError(
+                    "SDK initialization error: fileSyncer is missing but required for local file operations. " +
+                    "This is likely a bug in the SDK initialization - please report this issue to the Humanloop team.",
+                );
             }
+            request = handleLocalFiles(request, self, fileSyncer);
         }
-    };
-
-    // @ts-ignore
-    client.log = _overloadedLog.bind(client);
-    // @ts-ignore
-    client._log = originalLog.bind(client);
 
-    return client;
+        const [evalRequest, evalCallback] = handleEvaluationContext(request);
+        const response = await (self as any)._log(evalRequest, options);
+        
+        if (evalCallback !== null) {
+            await evalCallback(response.id);
+        }
+        return response;
+    } catch (error) {
+        if (error instanceof HumanloopRuntimeError) {
+            throw error;
+        }
+        throw new HumanloopRuntimeError(String(error));
+    }
 }
 
-export function overloadCall(client: Prompts): Prompts {
-    const originalCall = client.call.bind(client);
-
-    const _overloadedCall = async (
-        request: PromptLogRequest,
-        options?: Prompts.RequestOptions,
-    ): Promise<PromptCallResponse> => {
-        const traceId = getTraceId();
-        if (traceId !== undefined) {
-            if ("traceParentId" in request) {
-                console.warn(
-                    "Ignoring trace_parent_id argument: the Flow decorator manages tracing.",
+/**
+ * Overloaded call method implementation.
+ * Handles tracing context and local file loading.
+ * 
+ * @param self The client instance
+ * @param fileSyncer Optional FileSyncer for local file operations
+ * @param useLocalFiles Whether to use local files
+ * @param request The call request
+ * @param options Additional options
+ * @returns The call response
+ */
+async function overloadedCall<T extends ClientType>(
+    self: T,
+    fileSyncer: FileSyncer | undefined,
+    useLocalFiles: boolean,
+    request: any,
+    options?: any,
+) {
+    try {
+        request = handleTracingContext(request, self);
+        
+        // If `useLocalFiles` flag is True, we should use local file content for
+        // `call` operations on Prompt and Agent clients.
+        if (useLocalFiles && (self instanceof Prompts || self instanceof Agents)) {
+            if (!fileSyncer) {
+                throw new HumanloopRuntimeError(
+                    "fileSyncer is required for clients that support call operations",
                 );
             }
-            request = {
-                ...request,
-                traceParentId: traceId,
-            };
+            request = handleLocalFiles(request, self, fileSyncer);
         }
-
-        try {
-            return await originalCall(request, options);
-        } catch (e) {
-            throw new HumanloopRuntimeError(String(e));
+        
+        return await (self as any)._call(request, options);
+    } catch (error) {
+        if (error instanceof HumanloopRuntimeError) {
+            throw error;
         }
-    };
+        throw new HumanloopRuntimeError(String(error));
+    }
+}
 
-    client.call = _overloadedCall.bind(client);
+/**
+ * Overloads client methods to add tracing, local file handling, and evaluation context.
+ * 
+ * This function enhances clients by:
+ * 1. Adding tracing context to requests for Flow integration
+ * 2. Supporting local file loading for Prompt and Agent clients
+ * 3. Handling evaluation context for logging
+ * 
+ * @param client The client to overload
+ * @param fileSyncer Optional FileSyncer for local file operations
+ * @param useLocalFiles Whether to use local files (default: false)
+ * @returns The overloaded client
+ * @throws HumanloopRuntimeError If fileSyncer is missing but required
+ */
+export function overloadClient<T extends ClientType>(
+    client: T,
+    fileSyncer?: FileSyncer,
+    useLocalFiles: boolean = false,
+): T {
+    // Handle log method if it exists
+    if ("log" in client) {
+        const originalLog = (client as any).log.bind(client);
+        (client as any)._log = originalLog;
+        (client as any).log = async (request: LogRequestType, options?: any) => {
+            return overloadedLog(client, fileSyncer, useLocalFiles, request, options);
+        };
+    }
+
+    // Handle call method if it exists (for Prompts and Agents)
+    if (client instanceof Prompts || client instanceof Agents) {
+        // Verify fileSyncer is provided if needed
+        if (fileSyncer === undefined && useLocalFiles) {
+            console.error("fileSyncer is undefined but client has call method and useLocalFiles=%s", useLocalFiles);
+            throw new HumanloopRuntimeError("fileSyncer is required for clients that support call operations");
+        }
+        
+        const originalCall = (client as any).call.bind(client);
+        (client as any)._call = originalCall;
+        (client as any).call = async (request: any, options?: any) => {
+            return overloadedCall(client, fileSyncer, useLocalFiles, request, options);
+        };
+    }
 
     return client;
-}
+}
\ No newline at end of file
diff --git a/src/pathUtils.ts b/src/pathUtils.ts
new file mode 100644
index 00000000..5a2ba125
--- /dev/null
+++ b/src/pathUtils.ts
@@ -0,0 +1,47 @@
+import * as path from "path";
+
+/**
+ * Normalize a path to the standard Humanloop API format.
+ *
+ * This function is primarily used when interacting with the Humanloop API to ensure paths
+ * follow the standard format: 'path/to/resource' without leading/trailing slashes.
+ * It's used when pulling files from Humanloop to local filesystem (see FileSyncer.pull)
+ *
+ * The function:
+ * - Converts Windows backslashes to forward slashes
+ * - Normalizes consecutive slashes
+ * - Optionally strips file extensions (e.g. .prompt, .agent)
+ * - Removes leading/trailing slashes to match API conventions
+ *
+ * Leading/trailing slashes are stripped because the Humanloop API expects paths in the
+ * format 'path/to/resource' without them. This is consistent with how the API stores
+ * and references files, and ensures paths work correctly in both API calls and local
+ * filesystem operations.
+ *
+ * @param pathStr - The path to normalize. Can be a Windows or Unix-style path.
+ * @param stripExtension - If true, removes the file extension (e.g. .prompt, .agent)
+ * @returns Normalized path string in the format 'path/to/resource'
+ */
+export function normalizePath(
+    pathStr: string,
+    stripExtension: boolean = false,
+): string {
+    // Convert Windows backslashes to forward slashes
+    let normalizedPath = pathStr.replace(/\\/g, "/");
+
+    // Use path.posix to handle path normalization (handles consecutive slashes and . /..)
+    normalizedPath = path.posix.normalize(normalizedPath);
+
+    // Remove leading/trailing slashes
+    normalizedPath = normalizedPath.replace(/^\/+|\/+$/g, "");
+
+    // Strip extension if requested 
+    if (stripExtension && normalizedPath.includes(".")) {
+        normalizedPath = path.posix.join(
+            path.posix.dirname(normalizedPath),
+            path.posix.basename(normalizedPath, path.posix.extname(normalizedPath)),
+        );
+    }
+
+    return normalizedPath;
+}
diff --git a/src/sync/FileSyncer.ts b/src/sync/FileSyncer.ts
new file mode 100644
index 00000000..23aa97d1
--- /dev/null
+++ b/src/sync/FileSyncer.ts
@@ -0,0 +1,428 @@
+import { FileType } from "api";
+import fs from "fs";
+import path from "path";
+
+import * as pathUtils from "../pathUtils";
+import LRUCache from "../cache/LRUCache";
+import { HumanloopRuntimeError } from "../error";
+import { HumanloopClient } from "../humanloop.client";
+
+// Default cache size for file content caching
+const DEFAULT_CACHE_SIZE = 100;
+
+// File types that can be serialized to/from the filesystem
+export type SerializableFileType = "prompt" | "agent";
+export const SERIALIZABLE_FILE_TYPES = new Set<SerializableFileType>([
+    "prompt",
+    "agent",
+]);
+
+export interface FileSyncerOptions {
+    baseDir?: string;
+    cacheSize?: number;
+    verbose?: boolean;
+}
+
+// Simple logging with color and verbosity control
+const LogType = {
+    DEBUG: "\x1b[90m", // gray
+    INFO: "\x1b[96m", // cyan
+    WARN: "\x1b[93m", // yellow
+    ERROR: "\x1b[91m", // red
+    RESET: "\x1b[0m",
+} as const;
+
+function log(
+    message: string,
+    type: keyof typeof LogType,
+    verbose: boolean = false,
+): void {
+    // Only show debug/info if verbose is true
+    if ((type === "DEBUG" || type === "INFO") && !verbose) return;
+    console.log(`${LogType[type]}${message}${LogType.RESET}`);
+}
+
+/**
+ * Format API error messages to be more user-friendly.
+ */
+function formatApiError(error: Error, verbose: boolean = false): string {
+    const errorMsg = error.message || String(error);
+    try {
+        const detail = JSON.parse(errorMsg);
+        if (typeof detail === "string") {
+            return detail;
+        } else if (typeof detail === "object") {
+            return detail.description || detail.msg || errorMsg;
+        }
+        return errorMsg;
+    } catch (e) {
+        log(`Failed to parse error message: ${e}`, "DEBUG", verbose);
+        return errorMsg;
+    }
+}
+
+/**
+ * Client for synchronizing Prompt and Agent files between Humanloop workspace and local filesystem.
+ *
+ * This client enables a local development workflow by:
+ * 1. Pulling files from Humanloop workspace to local filesystem
+ * 2. Maintaining the same directory structure locally as in Humanloop
+ * 3. Storing files in human-readable, version-control friendly formats (.prompt and .agent)
+ * 4. Supporting local file access in the SDK when configured with use_local_files=true
+ *
+ * Files maintain their relative paths from the Humanloop workspace (with appropriate extensions added),
+ * allowing for seamless reference between local and remote environments using the same path identifiers.
+ */
+export default class FileSyncer {
+    // Default page size for API pagination when listing Files
+    private static readonly PAGE_SIZE = 100;
+
+    private readonly client: HumanloopClient;
+    private readonly baseDir: string;
+    private readonly cacheSize: number;
+    private readonly fileContentCache: LRUCache<string, string>;
+    private readonly verbose: boolean;
+
+    constructor(client: HumanloopClient, options: FileSyncerOptions = {}) {
+        this.client = client;
+        this.baseDir = options.baseDir || "humanloop";
+        this.cacheSize = options.cacheSize || DEFAULT_CACHE_SIZE;
+        this.fileContentCache = new LRUCache<string, string>(this.cacheSize);
+        this.verbose = options.verbose || false;
+    }
+
+    /**
+     * Implementation of get_file_content without the cache decorator.
+     *
+     * This is the actual implementation that gets wrapped by LRU cache.
+     *
+     * @param filePath The API path to the file (e.g. `path/to/file`)
+     * @param fileType The type of file to get the content of (SerializableFileType)
+     * @returns The raw file content
+     * @throws HumanloopRuntimeError If the file doesn't exist or can't be read
+     */
+    private _getFileContentImplementation(
+        filePath: string,
+        fileType: SerializableFileType,
+    ): string {
+        const fullPath = path.join(this.baseDir, `${filePath}.${fileType}`);
+        try {
+            // Read the raw file content
+            const fileContent = fs.readFileSync(fullPath, "utf8");
+            log(`Using local file content from ${fullPath}`, "DEBUG", this.verbose);
+            return fileContent;
+        } catch (error) {
+            throw new HumanloopRuntimeError(
+                `Failed to read ${fileType} ${filePath} from disk: ${error}`,
+            );
+        }
+    }
+
+    /**
+     * Get the raw file content of a file from cache or filesystem.
+     *
+     * This method uses an LRU cache to store file contents. When the cache is full,
+     * the least recently accessed files are automatically removed to make space.
+     *
+     * @param filePath The normalized path to the file (without extension)
+     * @param fileType The type of file (Prompt or Agent)
+     * @returns The raw file content
+     * @throws HumanloopRuntimeError If the file doesn't exist or can't be read
+     */
+    public getFileContent(filePath: string, fileType: SerializableFileType): string {
+        const cacheKey = `${filePath}:${fileType}`;
+
+        // Check if in cache
+        const cachedContent = this.fileContentCache.get(cacheKey);
+        if (cachedContent !== undefined) {
+            log(
+                `Using cached file content for ${filePath}.${fileType}`,
+                "DEBUG",
+                this.verbose,
+            );
+            return cachedContent;
+        }
+
+        // Not in cache, get from filesystem
+        const content = this._getFileContentImplementation(filePath, fileType);
+
+        // Add to cache
+        this.fileContentCache.set(cacheKey, content);
+
+        return content;
+    }
+
+    /**
+     * Clear the LRU cache.
+     */
+    public clearCache(): void {
+        this.fileContentCache.clear();
+    }
+
+    /**
+     * Check if the path is a file by checking for .{fileType} extension for serializable file types.
+     *
+     * Files are identified by having a supported extension (.prompt or .agent).
+     * This method performs case-insensitive comparison and handles whitespace.
+     *
+     * @returns True if the path ends with a supported file extension
+     */
+    public isFile(filePath: string): boolean {
+        const cleanPath = filePath.trim().toLowerCase(); // Convert to lowercase for case-insensitive comparison
+        return Array.from(SERIALIZABLE_FILE_TYPES).some((fileType) =>
+            cleanPath.endsWith(`.${fileType}`),
+        );
+    }
+
+    /**
+     * Save serialized file to local filesystem.
+     */
+    private _saveSerializedFile(
+        serializedContent: string,
+        filePath: string,
+        fileType: SerializableFileType,
+    ): void {
+        try {
+            // Create full path including baseDir prefix
+            const fullPath = path.join(this.baseDir, filePath);
+            const directory = path.dirname(fullPath);
+            const fileName = path.basename(fullPath, path.extname(fullPath));
+
+            // Create directory if it doesn't exist
+            fs.mkdirSync(directory, { recursive: true });
+
+            // Add file type extension
+            const newPath = path.join(directory, `${fileName}.${fileType}`);
+
+            // Write raw file content to file
+            fs.writeFileSync(newPath, serializedContent);
+            log(`Writing ${fileType} ${filePath} to disk`, "DEBUG", this.verbose);
+        } catch (error) {
+            log(`Failed to write ${fileType} ${filePath} to disk: ${error}`, "ERROR");
+            throw error;
+        }
+    }
+
+    /**
+     * Pull a specific file from Humanloop to local filesystem.
+     *
+     * @returns True if the file was successfully pulled, False otherwise (e.g. if the file was not found)
+     */
+    private async _pullFile(filePath: string, environment?: string): Promise<boolean> {
+        try {
+            const file = await this.client.files.retrieveByPath({
+                path: filePath,
+                environment,
+                includeRawFileContent: true,
+            });
+
+            if (!SERIALIZABLE_FILE_TYPES.has(file.type as SerializableFileType)) {
+                log(`Unsupported file type: ${file.type}`, "ERROR");
+                return false;
+            }
+
+            const rawContent = (file as any).rawFileContent;
+            if (!rawContent) {
+                log(`No content found for ${file.type} ${filePath}`, "ERROR");
+                return false;
+            }
+
+            this._saveSerializedFile(
+                rawContent,
+                file.path,
+                file.type as SerializableFileType,
+            );
+            return true;
+        } catch (error) {
+            log(`Failed to pull file ${filePath}: ${error}`, "ERROR");
+            return false;
+        }
+    }
+
+    /**
+     * Sync Prompt and Agent files from Humanloop to local filesystem.
+     *
+     * @returns An array containing two string arrays:
+     * - First array contains paths of successfully pulled files
+     * - Second array contains paths of files that failed to pull.
+     *   Failures can occur due to missing content in the response or errors during local file writing.
+     * @throws HumanloopRuntimeError If there's an error communicating with the API
+     */
+    private async _pullDirectory(
+        dirPath?: string,
+        environment?: string,
+    ): Promise<[string[], string[]]> {
+        const successfulFiles: string[] = [];
+        const failedFiles: string[] = [];
+        let page = 1;
+        let totalPages = 0;
+
+        log(
+            `Fetching files from ${dirPath || "root"} (environment: ${environment || "default"})`,
+            "INFO",
+            this.verbose,
+        );
+
+        while (true) {
+            try {
+                const response = await this.client.files.listFiles({
+                    type: Array.from(SERIALIZABLE_FILE_TYPES),
+                    page,
+                    size: FileSyncer.PAGE_SIZE,
+                    includeRawFileContent: true,
+                    environment,
+                    path: dirPath,
+                });
+
+                // Calculate total pages on first response
+                if (page === 1) {
+                    const actualPageSize = response.size || FileSyncer.PAGE_SIZE;
+                    totalPages = Math.ceil(response.total / actualPageSize);
+                }
+
+                if (response.records.length === 0) {
+                    break;
+                }
+
+                log(
+                    `Reading page ${page}/${totalPages} (${response.records.length} Files)`,
+                    "DEBUG",
+                    this.verbose,
+                );
+
+                // Process each file
+                for (const file of response.records) {
+                    if (
+                        !SERIALIZABLE_FILE_TYPES.has(file.type as SerializableFileType)
+                    ) {
+                        log(`Skipping unsupported file type: ${file.type}`, "WARN");
+                        continue;
+                    }
+
+                    const fileType = file.type as SerializableFileType;
+                    const rawContent = (file as any).rawFileContent;
+                    if (!rawContent) {
+                        log(`No content found for ${file.type} ${file.path}`, "WARN");
+                        failedFiles.push(file.path);
+                        continue;
+                    }
+
+                    try {
+                        this._saveSerializedFile(rawContent, file.path, fileType);
+                        successfulFiles.push(file.path);
+                    } catch (error) {
+                        failedFiles.push(file.path);
+                        log(`Failed to save ${file.path}: ${error}`, "ERROR");
+                    }
+                }
+
+                // Check if we've reached the last page
+                if (page >= totalPages) {
+                    break;
+                }
+                page += 1;
+            } catch (error) {
+                const formattedError = formatApiError(error as Error, this.verbose);
+                throw new HumanloopRuntimeError(
+                    `Failed to fetch page ${page}: ${formattedError}`,
+                );
+            }
+        }
+
+        if (failedFiles.length > 0) {
+            log(`Failed to pull ${failedFiles.length} files`, "WARN");
+        }
+
+        return [successfulFiles, failedFiles];
+    }
+
+    /**
+     * Pull files from Humanloop to local filesystem.
+     *
+     * If the path ends with `.prompt` or `.agent`, pulls that specific file.
+     * Otherwise, pulls all files under the specified path.
+     * If no path is provided, pulls all files from the root.
+     *
+     * @param filePath The path to pull from. Can be:
+     * - A specific file with extension (e.g. "path/to/file.prompt")
+     * - A directory without extension (e.g. "path/to/directory")
+     * - None to pull all files from root
+     *
+     * Paths should not contain leading or trailing slashes
+     * @param environment The environment to pull from
+     * @returns An array containing two string arrays:
+     * - First array contains paths of successfully pulled files
+     * - Second array contains paths of files that failed to pull (e.g. failed to write to disk or missing raw content)
+     * @throws HumanloopRuntimeError If there's an error communicating with the API
+     */
+    public async pull(
+        filePath?: string,
+        environment?: string,
+    ): Promise<[string[], string[]]> {
+        const startTime = Date.now();
+
+        let apiPath: string | undefined;
+        let isFilePath: boolean;
+
+        if (filePath === undefined) {
+            apiPath = undefined;
+            isFilePath = false;
+        } else {
+            filePath = filePath.trim();
+            // Check if path has leading/trailing slashes
+            if (filePath !== filePath.trim().replace(/^\/+|\/+$/g, "")) {
+                throw new HumanloopRuntimeError(
+                    `Invalid path: ${filePath}. Path should not contain leading/trailing slashes. ` +
+                        `Valid examples: "path/to/file.prompt" or "path/to/directory"`,
+                );
+            }
+
+            // Check if it's a file path (has extension)
+            isFilePath = this.isFile(filePath);
+
+            // For API communication, we need path without extension
+            apiPath = pathUtils.normalizePath(filePath, true);
+        }
+
+        try {
+            let successfulFiles: string[];
+            let failedFiles: string[];
+
+            if (apiPath === undefined) {
+                [successfulFiles, failedFiles] = await this._pullDirectory(
+                    undefined,
+                    environment,
+                );
+            } else {
+                if (isFilePath) {
+                    if (await this._pullFile(apiPath, environment)) {
+                        successfulFiles = [apiPath];
+                        failedFiles = [];
+                    } else {
+                        successfulFiles = [];
+                        failedFiles = [apiPath];
+                    }
+                } else {
+                    [successfulFiles, failedFiles] = await this._pullDirectory(
+                        apiPath,
+                        environment,
+                    );
+                }
+            }
+
+            // Clear the cache at the end of each pull operation
+            this.clearCache();
+
+            const duration = Date.now() - startTime;
+            log(
+                `Successfully pulled ${successfulFiles.length} files in ${duration}ms`,
+                "INFO",
+                this.verbose,
+            );
+
+            return [successfulFiles, failedFiles];
+        } catch (error) {
+            throw new HumanloopRuntimeError(`Pull operation failed: ${error}`);
+        }
+    }
+}
diff --git a/src/sync/index.ts b/src/sync/index.ts
new file mode 100644
index 00000000..bf310919
--- /dev/null
+++ b/src/sync/index.ts
@@ -0,0 +1,7 @@
+/**
+ * File synchronization for Humanloop
+ * 
+ * This module provides sync functionality between Humanloop and the local filesystem.
+ */
+
+export { default as FileSyncer, FileSyncerOptions } from './FileSyncer';
\ No newline at end of file
diff --git a/tests/custom.test.ts b/tests/custom.test.ts
deleted file mode 100644
index 7f5e031c..00000000
--- a/tests/custom.test.ts
+++ /dev/null
@@ -1,13 +0,0 @@
-/**
- * This is a custom test file, if you wish to add more tests
- * to your SDK.
- * Be sure to mark this file in `.fernignore`.
- *
- * If you include example requests/responses in your fern definition,
- * you will have tests automatically generated for you.
- */
-describe("test", () => {
-    it("default", () => {
-        expect(true).toBe(true);
-    });
-});
diff --git a/tests/custom/FileSyncer.test.ts b/tests/custom/FileSyncer.test.ts
new file mode 100644
index 00000000..ed003c95
--- /dev/null
+++ b/tests/custom/FileSyncer.test.ts
@@ -0,0 +1,364 @@
+import * as fs from "fs";
+import * as path from "path";
+import { v4 as uuidv4 } from "uuid";
+
+import { HumanloopRuntimeError } from "../../src/error";
+import FileSyncer, {
+    SERIALIZABLE_FILE_TYPES,
+    SerializableFileType,
+} from "../../src/sync/FileSyncer";
+
+// Mock for HumanloopClient
+class MockHumanloopClient {
+    files = {
+        retrieveByPath: jest.fn(),
+        listFiles: jest.fn(),
+    };
+}
+
+describe("FileSyncer", () => {
+    let mockClient: MockHumanloopClient;
+    let fileSyncer: FileSyncer;
+    let tempDir: string;
+
+    beforeEach(() => {
+        mockClient = new MockHumanloopClient();
+        tempDir = path.join(process.cwd(), "test-tmp", uuidv4());
+
+        // Create temporary directory
+        fs.mkdirSync(tempDir, { recursive: true });
+
+        fileSyncer = new FileSyncer(mockClient as any, {
+            baseDir: tempDir,
+            cacheSize: 10,
+            verbose: true, // Enable verbose logging for tests
+        });
+    });
+
+    afterEach(() => {
+        // Clean up temporary files
+        if (fs.existsSync(tempDir)) {
+            fs.rmSync(tempDir, { recursive: true, force: true });
+        }
+
+        // Clear all mocks
+        jest.clearAllMocks();
+    });
+
+    describe("initialization", () => {
+        it("should initialize with correct base directory, cache size and file types", () => {
+            // Check that the FileSyncer is initialized with the correct properties
+            expect(fileSyncer["baseDir"]).toBe(tempDir);
+            expect(fileSyncer["cacheSize"]).toBe(10);
+            expect(SERIALIZABLE_FILE_TYPES).toEqual(new Set(["prompt", "agent"]));
+        });
+    });
+
+    describe("isFile", () => {
+        it("should correctly identify prompt and agent files with case insensitivity", () => {
+            // Standard lowercase extensions
+            expect(fileSyncer.isFile("test.prompt")).toBe(true);
+            expect(fileSyncer.isFile("test.agent")).toBe(true);
+
+            // Uppercase extensions (case insensitivity)
+            expect(fileSyncer.isFile("test.PROMPT")).toBe(true);
+            expect(fileSyncer.isFile("test.AGENT")).toBe(true);
+            expect(fileSyncer.isFile("test.Prompt")).toBe(true);
+            expect(fileSyncer.isFile("test.Agent")).toBe(true);
+
+            // With whitespace
+            expect(fileSyncer.isFile(" test.prompt ")).toBe(true);
+            expect(fileSyncer.isFile(" test.agent ")).toBe(true);
+        });
+
+        it("should return false for invalid or missing extensions", () => {
+            // Invalid file types
+            expect(fileSyncer.isFile("test.txt")).toBe(false);
+            expect(fileSyncer.isFile("test.json")).toBe(false);
+            expect(fileSyncer.isFile("test.py")).toBe(false);
+
+            // No extension
+            expect(fileSyncer.isFile("test")).toBe(false);
+            expect(fileSyncer.isFile("prompt")).toBe(false);
+            expect(fileSyncer.isFile("agent")).toBe(false);
+
+            // Partial extensions
+            expect(fileSyncer.isFile("test.prom")).toBe(false);
+            expect(fileSyncer.isFile("test.age")).toBe(false);
+        });
+    });
+
+    describe("file operations", () => {
+        it("should save and read files correctly", () => {
+            // Given a file content and path
+            const content = "test content";
+            const filePath = "test/path";
+            const fileType: SerializableFileType = "prompt";
+
+            // When saving the file
+            fileSyncer["_saveSerializedFile"](content, filePath, fileType);
+
+            // Then the file should exist on disk
+            const savedPath = path.join(tempDir, filePath + "." + fileType);
+            expect(fs.existsSync(savedPath)).toBe(true);
+
+            // When reading the file
+            const readContent = fileSyncer.getFileContent(filePath, fileType);
+
+            // Then the content should match
+            expect(readContent).toBe(content);
+        });
+
+        it("should throw an error when reading a nonexistent file", () => {
+            // When trying to read a nonexistent file
+            // Then a HumanloopRuntimeError should be raised
+            expect(() => {
+                fileSyncer.getFileContent("nonexistent", "prompt");
+            }).toThrow(HumanloopRuntimeError);
+
+            // Check that the error message contains expected text
+            expect(() => {
+                fileSyncer.getFileContent("nonexistent", "prompt");
+            }).toThrow(/Failed to read/);
+        });
+
+        it("should return false when API calls fail during pull", async () => {
+            // Given an API error
+            mockClient.files.retrieveByPath.mockRejectedValue(new Error("API Error"));
+
+            // When trying to pull a file
+            const result = await fileSyncer["_pullFile"]("test.prompt");
+
+            // Then it should return false
+            expect(result).toBe(false);
+
+            // And the API method should have been called
+            expect(mockClient.files.retrieveByPath).toHaveBeenCalled();
+        });
+    });
+
+    describe("cache functionality", () => {
+        it("should cache file content and respect cache invalidation", () => {
+            // Given a test file
+            const content = "test content";
+            const filePath = "test/path";
+            const fileType: SerializableFileType = "prompt";
+            fileSyncer["_saveSerializedFile"](content, filePath, fileType);
+
+            // When reading the file for the first time
+            const firstRead = fileSyncer.getFileContent(filePath, fileType);
+            expect(firstRead).toBe(content);
+
+            // When modifying the file on disk
+            const savedPath = path.join(tempDir, filePath + "." + fileType);
+            fs.writeFileSync(savedPath, "modified content");
+
+            // Then subsequent reads should use cache (and return the original content)
+            const secondRead = fileSyncer.getFileContent(filePath, fileType);
+            expect(secondRead).toBe(content); // Should return cached content, not modified
+
+            // When clearing the cache
+            fileSyncer.clearCache();
+
+            // Then new content should be read from disk
+            const thirdRead = fileSyncer.getFileContent(filePath, fileType);
+            expect(thirdRead).toBe("modified content");
+        });
+
+        it("should respect the cache size limit", () => {
+            // Create a file syncer with small cache
+            const smallCacheFileSyncer = new FileSyncer(mockClient as any, {
+                baseDir: tempDir,
+                cacheSize: 2, // Only 2 items in cache
+            });
+
+            // Save 3 different files
+            for (let i = 1; i <= 3; i++) {
+                const content = `content ${i}`;
+                const filePath = `test/path${i}`;
+                const fileType: SerializableFileType = "prompt";
+                smallCacheFileSyncer["_saveSerializedFile"](
+                    content,
+                    filePath,
+                    fileType,
+                );
+
+                // Read to put in cache
+                smallCacheFileSyncer.getFileContent(filePath, fileType);
+            }
+
+            // Modify the first file (which should have been evicted from cache)
+            const firstPath = "test/path1";
+            const savedPath = path.join(tempDir, firstPath + ".prompt");
+            fs.writeFileSync(savedPath, "modified content");
+
+            // Reading the first file should get the modified content (not cached)
+            const newContent = smallCacheFileSyncer.getFileContent(firstPath, "prompt");
+            expect(newContent).toBe("modified content");
+
+            // But reading the 2nd and 3rd files should still use cache
+            expect(smallCacheFileSyncer.getFileContent("test/path2", "prompt")).toBe(
+                "content 2",
+            );
+            expect(smallCacheFileSyncer.getFileContent("test/path3", "prompt")).toBe(
+                "content 3",
+            );
+        });
+    });
+
+    describe("pull operations", () => {
+        it("should handle successful file pull", async () => {
+            // Mock successful file pull response
+            mockClient.files.retrieveByPath.mockResolvedValue({
+                type: "prompt",
+                path: "test/path",
+                rawFileContent: "pulled content",
+            });
+
+            // When pulling a file
+            const result = await fileSyncer["_pullFile"]("test/path");
+
+            // Then it should return true
+            expect(result).toBe(true);
+
+            // And the file should be saved to disk
+            const savedPath = path.join(tempDir, "test/path.prompt");
+            expect(fs.existsSync(savedPath)).toBe(true);
+            expect(fs.readFileSync(savedPath, "utf8")).toBe("pulled content");
+        });
+
+        it("should handle unsuccessful file pull due to missing content", async () => {
+            // Mock response with missing content
+            mockClient.files.retrieveByPath.mockResolvedValue({
+                type: "prompt",
+                path: "test/path",
+                // missing rawFileContent
+            });
+
+            // When pulling a file
+            const result = await fileSyncer["_pullFile"]("test/path");
+
+            // Then it should return false
+            expect(result).toBe(false);
+        });
+
+        it("should handle unsuccessful file pull due to unsupported type", async () => {
+            // Mock response with unsupported type
+            mockClient.files.retrieveByPath.mockResolvedValue({
+                type: "dataset", // Not a serializable type
+                path: "test/path",
+                rawFileContent: "content",
+            });
+
+            // When pulling a file
+            const result = await fileSyncer["_pullFile"]("test/path");
+
+            // Then it should return false
+            expect(result).toBe(false);
+        });
+
+        it("should pull a directory of files", async () => {
+            // Mock directory listing responses (paginated)
+            mockClient.files.listFiles.mockResolvedValueOnce({
+                records: [
+                    {
+                        type: "prompt",
+                        path: "dir/file1",
+                        rawFileContent: "content 1",
+                    },
+                    {
+                        type: "agent",
+                        path: "dir/file2",
+                        rawFileContent: "content 2",
+                    },
+                ],
+                page: 1,
+                size: 2,
+                total: 3,
+            });
+
+            mockClient.files.listFiles.mockResolvedValueOnce({
+                records: [
+                    {
+                        type: "prompt",
+                        path: "dir/file3",
+                        rawFileContent: "content 3",
+                    },
+                ],
+                page: 2,
+                size: 2,
+                total: 3,
+            });
+
+            // When pulling a directory
+            const [successful, failed] = await fileSyncer["_pullDirectory"]("dir");
+
+            // Then it should succeed for all files
+            expect(successful.length).toBe(3);
+            expect(failed.length).toBe(0);
+
+            // And all files should exist on disk
+            expect(fs.existsSync(path.join(tempDir, "dir/file1.prompt"))).toBe(true);
+            expect(fs.existsSync(path.join(tempDir, "dir/file2.agent"))).toBe(true);
+            expect(fs.existsSync(path.join(tempDir, "dir/file3.prompt"))).toBe(true);
+        });
+
+        it("should handle the main pull method with different path types", async () => {
+            // Mock methods that are called by pull
+            jest.spyOn(fileSyncer, "isFile").mockImplementation((p) =>
+                p.endsWith(".prompt"),
+            );
+            jest.spyOn(fileSyncer as any, "_pullFile").mockResolvedValue(true);
+            jest.spyOn(fileSyncer as any, "_pullDirectory").mockResolvedValue([
+                ["dir/file1"],
+                [],
+            ]);
+
+            // Test with file path
+            await fileSyncer.pull("test/path.prompt");
+            expect(fileSyncer["_pullFile"]).toHaveBeenCalledWith(
+                "test/path",
+                undefined,
+            );
+
+            // Reset mocks
+            jest.clearAllMocks();
+
+            // Test with directory path
+            await fileSyncer.pull("test/dir");
+            expect(fileSyncer["_pullDirectory"]).toHaveBeenCalledWith(
+                "test/dir",
+                undefined,
+            );
+
+            // Reset mocks
+            jest.clearAllMocks();
+
+            // Test with no path (root)
+            await fileSyncer.pull();
+            expect(fileSyncer["_pullDirectory"]).toHaveBeenCalledWith(
+                undefined,
+                undefined,
+            );
+
+            // Test with environment parameter
+            await fileSyncer.pull("test/path.prompt", "staging");
+            expect(fileSyncer["_pullFile"]).toHaveBeenCalledWith(
+                "test/path",
+                "staging",
+            );
+        });
+
+        it("should reject paths with leading or trailing slashes", async () => {
+            // Test with leading slash
+            await expect(fileSyncer.pull("/test/path")).rejects.toThrow(
+                HumanloopRuntimeError,
+            );
+
+            // Test with trailing slash
+            await expect(fileSyncer.pull("test/path/")).rejects.toThrow(
+                HumanloopRuntimeError,
+            );
+        });
+    });
+});
diff --git a/tests/custom/fixtures.ts b/tests/custom/fixtures.ts
new file mode 100644
index 00000000..9909abc4
--- /dev/null
+++ b/tests/custom/fixtures.ts
@@ -0,0 +1,21 @@
+import * as fs from "fs";
+import * as path from "path";
+import { v4 as uuidv4 } from "uuid";
+
+/**
+ * Creates a temporary directory for tests
+ * @param prefix Optional prefix for the directory name
+ * @returns Path to the created directory and a cleanup function
+ */
+export function createTempDir(prefix = "test") {
+    const tempDir = path.join(process.cwd(), "test-tmp", `${prefix}-${uuidv4()}`);
+    fs.mkdirSync(tempDir, { recursive: true });
+
+    const cleanup = () => {
+        if (fs.existsSync(tempDir)) {
+            fs.rmSync(tempDir, { recursive: true, force: true });
+        }
+    };
+
+    return { tempDir, cleanup };
+}
diff --git a/tests/custom/integration/FileSyncer.test.ts b/tests/custom/integration/FileSyncer.test.ts
new file mode 100644
index 00000000..7afa1ab2
--- /dev/null
+++ b/tests/custom/integration/FileSyncer.test.ts
@@ -0,0 +1,160 @@
+import * as fs from "fs";
+import * as path from "path";
+import { v4 as uuidv4 } from "uuid";
+
+import { FileType } from "../../../src/api";
+import { HumanloopRuntimeError } from "../../../src/error";
+import { HumanloopClient } from "../../../src/humanloop.client";
+import { createTempDir } from "../fixtures";
+import {
+    SyncableFile,
+    TestSetup,
+    cleanupTestEnvironment,
+    createSyncableFilesFixture,
+    setupTestEnvironment,
+} from "./fixtures";
+
+describe("FileSyncer Integration Tests", () => {
+    let testSetup: TestSetup;
+    let syncableFiles: SyncableFile[] = [];
+    let tempDirInfo: { tempDir: string; cleanup: () => void };
+
+    beforeAll(async () => {
+        // Set up test environment
+        testSetup = await setupTestEnvironment("file_sync");
+        tempDirInfo = createTempDir("file-sync-integration");
+
+        // Create test files in Humanloop for syncing
+        syncableFiles = await createSyncableFilesFixture(testSetup);
+    });
+
+    afterAll(async () => {
+        // Clean up resources only if they were created
+        if (tempDirInfo) {
+            tempDirInfo.cleanup();
+        }
+        if (testSetup) {
+            await cleanupTestEnvironment(
+                testSetup,
+                syncableFiles.map((file) => ({
+                    type: file.type as FileType,
+                    id: file.id as string,
+                })),
+            );
+        }
+    }, 30000);
+
+    test("pull_basic: should pull all files from remote to local filesystem", async () => {
+        // GIVEN a set of files in the remote system (from syncableFiles)
+        const client = new HumanloopClient({
+            apiKey: process.env.HUMANLOOP_API_KEY,
+            localFilesDirectory: tempDirInfo.tempDir,
+            useLocalFiles: true,
+        });
+
+        // WHEN running the pull operation
+        await client.pull();
+
+        // THEN our local filesystem should mirror the remote filesystem in the HL Workspace
+        for (const file of syncableFiles) {
+            const extension = `.${file.type}`;
+            const localPath = path.join(
+                tempDirInfo.tempDir,
+                `${file.path}${extension}`,
+            );
+
+            // THEN the file and its directory should exist
+            expect(fs.existsSync(localPath)).toBe(true);
+            expect(fs.existsSync(path.dirname(localPath))).toBe(true);
+
+            // THEN the file should not be empty
+            const content = fs.readFileSync(localPath, "utf8");
+            expect(content).toBeTruthy();
+        }
+    }, 30000);
+
+    test("pull_with_invalid_path: should handle error when path doesn't exist", async () => {
+        // GIVEN a client
+        const client = new HumanloopClient({
+            apiKey: process.env.HUMANLOOP_API_KEY,
+            localFilesDirectory: tempDirInfo.tempDir,
+            useLocalFiles: true,
+        });
+
+        const nonExistentPath = `${testSetup.sdkTestDir.path}/non_existent_directory`;
+
+        // WHEN/THEN pulling with an invalid path should throw an error
+        await expect(client.pull(nonExistentPath)).rejects.toThrow(
+            HumanloopRuntimeError,
+        );
+        // The error message might be different in TypeScript, so we don't assert on the exact message
+    });
+
+    test("pull_with_invalid_environment: should handle error when environment doesn't exist", async () => {
+        // GIVEN a client
+        const client = new HumanloopClient({
+            apiKey: process.env.HUMANLOOP_API_KEY,
+            localFilesDirectory: tempDirInfo.tempDir,
+            useLocalFiles: true,
+        });
+
+        // WHEN/THEN pulling with an invalid environment should throw an error
+        await expect(client.pull(undefined, "invalid_environment")).rejects.toThrow(
+            HumanloopRuntimeError,
+        );
+    });
+
+    test("pull_with_path_filter: should only pull files from specified path", async () => {
+        // GIVEN a client and a clean temp directory
+        const pathFilterTempDir = createTempDir("file-sync-path-filter");
+
+        const client = new HumanloopClient({
+            apiKey: process.env.HUMANLOOP_API_KEY,
+            localFilesDirectory: pathFilterTempDir.tempDir,
+            useLocalFiles: true,
+        });
+
+        // WHEN pulling only files from the testSetup.sdkTestDir.path
+        await client.pull(testSetup.sdkTestDir.path);
+
+        // THEN count the total number of files pulled
+        let pulledFileCount = 0;
+
+        // Collect expected file paths (relative to sdkTestDir.path)
+        const expectedFiles = new Set(
+            syncableFiles.map((file) =>
+                path.join(
+                    pathFilterTempDir.tempDir,
+                    file.path + (file.type === "prompt" ? ".prompt" : ".agent"),
+                ),
+            ),
+        );
+
+        const foundFiles = new Set<string>();
+
+        function countFilesRecursive(dirPath: string): void {
+            const entries = fs.readdirSync(dirPath, { withFileTypes: true });
+            for (const entry of entries) {
+                const fullPath = path.join(dirPath, entry.name);
+                if (entry.isDirectory()) {
+                    countFilesRecursive(fullPath);
+                } else if (entry.isFile()) {
+                    if (expectedFiles.has(fullPath)) {
+                        const content = fs.readFileSync(fullPath, "utf8");
+                        expect(content).toBeTruthy();
+                        foundFiles.add(fullPath);
+                    }
+                }
+            }
+        }
+
+        if (fs.existsSync(pathFilterTempDir.tempDir)) {
+            countFilesRecursive(pathFilterTempDir.tempDir);
+        }
+
+        expect(foundFiles.size).toBe(expectedFiles.size);
+
+        // Clean up
+        pathFilterTempDir.cleanup();
+    });
+});
diff --git a/tests/custom/integration/cli.test.ts b/tests/custom/integration/cli.test.ts
new file mode 100644
index 00000000..be710dc4
--- /dev/null
+++ b/tests/custom/integration/cli.test.ts
@@ -0,0 +1,295 @@
+import * as fs from "fs";
+import * as path from "path";
+import { spawn } from "child_process";
+
+import { createTempDir } from "../fixtures";
+import {
+    TestSetup,
+    cleanupTestEnvironment,
+    createSyncableFilesFixture,
+    setupTestEnvironment,
+} from "./fixtures";
+
+// Helper function to run CLI commands with TypeScript
+async function runCli(
+    args: string[],
+): Promise<{ stdout: string; stderr: string; exitCode: number }> {
+    return new Promise((resolve) => {
+        const packageRoot = path.resolve(__dirname, "../../../");
+        const cliPath = path.join(packageRoot, "dist/cli.js");
+
+        // Use spawn to avoid shell interpretation issues
+        const childProcess = spawn("node", [cliPath, ...args], {
+            stdio: ["ignore", "pipe", "pipe"],
+        });
+
+        let stdout = "";
+        let stderr = "";
+
+        childProcess.stdout?.on("data", (data) => {
+            stdout += data.toString();
+        });
+
+        childProcess.stderr?.on("data", (data) => {
+            stderr += data.toString();
+        });
+
+        childProcess.on("close", (code) => {
+            resolve({
+                stdout,
+                stderr,
+                exitCode: code !== null ? code : 0,
+            });
+        });
+    });
+}
+
+describe("CLI Integration Tests", () => {
+    let testSetup: TestSetup;
+    let syncableFiles: any[] = [];
+
+    beforeAll(async () => {
+        // Increase timeout for setup operations
+        jest.setTimeout(40000); // 40 seconds
+
+        // Set up test environment
+        testSetup = await setupTestEnvironment("cli_test");
+
+        // Create test files in Humanloop for syncing
+        syncableFiles = await createSyncableFilesFixture(testSetup);
+    }, 30000);
+
+    afterAll(async () => {
+        await cleanupTestEnvironment(
+            testSetup,
+            syncableFiles.map((file) => ({
+                type: file.type as any,
+                id: file.id as string,
+            })),
+        );
+    }, 30000);
+
+    /**
+     * NOTE: This test is currently skipped due to issues with CLI environment isolation.
+     * 
+     * The test attempts to verify behavior when no API key is available, but faces 
+     * challenges with how Node.js handles process execution during tests:
+     * 
+     * 1. When executed via child_process.exec, the path to nonexistent env files 
+     *    causes Node to return exit code 9 (SIGKILL) instead of the expected code 1
+     * 2. Shell interpretation of arguments makes it difficult to reliably test this edge case
+     * 
+     * If this functionality needs testing, consider:
+     * - Using child_process.spawn for better argument handling
+     * - Unit testing the API key validation logic directly
+     * - Moving this test to a separate process with full environment isolation
+     * 
+     * @see https://nodejs.org/api/child_process.html for more info on process execution
+    */
+    test.skip("pull_without_api_key: should show error when no API key is available", async () => {
+        // GIVEN a temporary directory and no API key
+        const { tempDir, cleanup } = createTempDir("cli-no-api-key");
+
+        // Create a path to a file that definitely doesn't exist
+        const nonExistentEnvFile = path.join(tempDir, "__DOES_NOT_EXIST__.env");
+
+        // WHEN running pull command without API key
+        const originalApiKey = process.env.HUMANLOOP_API_KEY;
+        delete process.env.HUMANLOOP_API_KEY;
+
+        const result = await runCli([
+            "pull",
+            "--local-files-directory",
+            tempDir,
+            "--env-file",
+            `"${nonExistentEnvFile}"`,
+        ]);
+
+        // Restore API key
+        process.env.HUMANLOOP_API_KEY = originalApiKey;
+
+        // THEN it should fail with appropriate error message
+        expect(result.exitCode).not.toBe(0);
+        expect(result.stderr + result.stdout).toContain(
+            "Failed to load environment file",
+        );
+
+        cleanup();
+    });
+
+    test("pull_basic: should pull all files successfully", async () => {
+        // Increase timeout for this test
+        jest.setTimeout(30000); // 30 seconds
+
+        // GIVEN a base directory for pulled files
+        const { tempDir, cleanup } = createTempDir("cli-basic-pull");
+
+        // WHEN running pull command
+        const result = await runCli([
+            "pull",
+            "--local-files-directory",
+            tempDir,
+            "--verbose",
+            "--api-key",
+            process.env.HUMANLOOP_API_KEY || "",
+        ]);
+
+        // THEN it should succeed
+        expect(result.exitCode).toBe(0);
+        expect(result.stdout).toContain("Pulling files from Humanloop");
+        expect(result.stdout).toContain("Pull completed");
+
+        // THEN the files should exist locally
+        for (const file of syncableFiles) {
+            const extension = `.${file.type}`;
+            const localPath = path.join(tempDir, `${file.path}${extension}`);
+
+            expect(fs.existsSync(localPath)).toBe(true);
+            expect(fs.existsSync(path.dirname(localPath))).toBe(true);
+
+            const content = fs.readFileSync(localPath, "utf8");
+            expect(content).toBeTruthy();
+        }
+
+        cleanup();
+    }, 30000);
+
+    test("pull_with_specific_path: should pull files from a specific path", async () => {
+        // GIVEN a base directory and specific path
+        const { tempDir, cleanup } = createTempDir("cli-path-pull");
+
+        // Get the prefix of the first file's path (test directory)
+        const testPath = syncableFiles[0].path.split("/")[0];
+
+        // WHEN running pull command with path
+        const result = await runCli([
+            "pull",
+            "--local-files-directory",
+            tempDir,
+            "--path",
+            testPath,
+            "--verbose",
+            "--api-key",
+            process.env.HUMANLOOP_API_KEY || "",
+        ]);
+
+        // THEN it should succeed and show the path
+        expect(result.exitCode).toBe(0);
+        expect(result.stdout).toContain(`Path: ${testPath}`);
+
+        // THEN only files from that path should exist locally
+        for (const file of syncableFiles) {
+            const extension = `.${file.type}`;
+            const localPath = path.join(tempDir, `${file.path}${extension}`);
+
+            if (file.path.startsWith(testPath)) {
+                expect(fs.existsSync(localPath)).toBe(true);
+            } else {
+                expect(fs.existsSync(localPath)).toBe(false);
+            }
+        }
+
+        cleanup();
+    });
+
+    test("pull_with_environment: should pull files from a specific environment", async () => {
+        // Increase timeout for this test
+        jest.setTimeout(30000); // 30 seconds
+
+        // GIVEN a base directory and environment
+        const { tempDir, cleanup } = createTempDir("cli-env-pull");
+
+        // WHEN running pull command with environment
+        const result = await runCli([
+            "pull",
+            "--local-files-directory",
+            tempDir,
+            "--environment",
+            "staging",
+            "--verbose",
+            "--api-key",
+            process.env.HUMANLOOP_API_KEY || "",
+        ]);
+
+        // THEN it should succeed and show the environment
+        expect(result.exitCode).toBe(0);
+        expect(result.stdout).toContain("Environment: staging");
+
+        cleanup();
+    }, 30000);
+
+    test("pull_with_quiet_mode: should pull files with quiet mode enabled", async () => {
+        // GIVEN a base directory and quiet mode
+        const { tempDir, cleanup } = createTempDir("cli-quiet-pull");
+
+        // WHEN running pull command with quiet mode
+        const result = await runCli([
+            "pull",
+            "--local-files-directory",
+            tempDir,
+            "--quiet",
+            "--api-key",
+            process.env.HUMANLOOP_API_KEY || "",
+        ]);
+
+        // THEN it should succeed but not show file list
+        expect(result.exitCode).toBe(0);
+        expect(result.stdout).not.toContain("Successfully pulled");
+
+        // THEN files should still be pulled
+        for (const file of syncableFiles) {
+            const extension = `.${file.type}`;
+            const localPath = path.join(tempDir, `${file.path}${extension}`);
+            expect(fs.existsSync(localPath)).toBe(true);
+        }
+
+        cleanup();
+    });
+
+    test("pull_with_invalid_path: should handle error when pulling from an invalid path", async () => {
+        // GIVEN an invalid path
+        const { tempDir, cleanup } = createTempDir("cli-invalid-path");
+        const path = "nonexistent/path";
+
+        // WHEN running pull command
+        const result = await runCli([
+            "pull",
+            "--local-files-directory",
+            tempDir,
+            "--path",
+            path,
+            "--api-key",
+            process.env.HUMANLOOP_API_KEY || "",
+        ]);
+
+        // THEN it should fail
+        expect(result.exitCode).toBe(1);
+        expect(result.stderr + result.stdout).toContain("Error");
+
+        cleanup();
+    });
+
+    test("pull_with_invalid_environment: should handle error when pulling from an invalid environment", async () => {
+        // GIVEN an invalid environment
+        const { tempDir, cleanup } = createTempDir("cli-invalid-env");
+        const environment = "nonexistent";
+
+        // WHEN running pull command
+        const result = await runCli([
+            "pull",
+            "--local-files-directory",
+            tempDir,
+            "--environment",
+            environment,
+            "--verbose",
+            "--api-key",
+            process.env.HUMANLOOP_API_KEY || "",
+        ]);
+
+        // THEN it should fail
+        expect(result.exitCode).toBe(1);
+        expect(result.stderr + result.stdout).toContain("Error");
+
+        cleanup();
+    });
+});
diff --git a/tests/custom/integration/decorators.test.ts b/tests/custom/integration/decorators.test.ts
new file mode 100644
index 00000000..ef9e22a0
--- /dev/null
+++ b/tests/custom/integration/decorators.test.ts
@@ -0,0 +1,502 @@
+import OpenAI from "openai";
+
+import { PromptRequest } from "../../../src/api";
+import { HumanloopRuntimeError } from "../../../src/error";
+import {
+    CleanupResources,
+    TestPrompt,
+    TestSetup,
+    cleanupTestEnvironment,
+    setupTestEnvironment,
+} from "./fixtures";
+
+// Long timeout per test
+jest.setTimeout(30 * 1000);
+
+// process.stdout.moveCursor is undefined in jest; mocking it since STDOUT is not relevant
+if (typeof process.stdout.moveCursor !== "function") {
+    process.stdout.moveCursor = (
+        dx: number,
+        dy: number,
+        callback?: () => void,
+    ): boolean => {
+        if (callback) callback();
+        return true;
+    };
+}
+
+/**
+ * Creates a test prompt in the specified test environment
+ */
+async function createTestPrompt(
+    setup: TestSetup,
+    name: string = "test_prompt",
+    customConfig?: Partial<PromptRequest>,
+): Promise<TestPrompt> {
+    const promptPath = `${setup.sdkTestDir.path}/${name}`;
+    const config = customConfig
+        ? { ...setup.testPromptConfig, ...customConfig }
+        : setup.testPromptConfig;
+
+    const promptResponse = await setup.humanloopClient.prompts.upsert({
+        path: promptPath,
+        ...config,
+    });
+
+    return {
+        id: promptResponse.id,
+        path: promptPath,
+        response: promptResponse,
+    };
+}
+
+/**
+ * Creates a base function for LLM calls that can be decorated
+ */
+function createBaseLLMFunction(setup: TestSetup, model: string = "gpt-4o-mini") {
+    return async (question: string): Promise<string> => {
+        const openaiClient = new OpenAI({ apiKey: setup.openaiApiKey });
+
+        const response = await openaiClient.chat.completions.create({
+            model: model,
+            messages: [{ role: "user", content: question }],
+        });
+
+        return response.choices[0].message.content || "";
+    };
+}
+
+/**
+ * Applies the prompt decorator to a function and tests it
+ */
+async function testPromptDecorator(
+    setup: TestSetup,
+    prompt: TestPrompt,
+    input: string = "What is the capital of the France?",
+    expectedSubstring: string = "paris",
+): Promise<void> {
+    // Create the base function
+    const myPromptBase = createBaseLLMFunction(setup);
+
+    // Apply the higher-order function instead of decorator
+    const myPrompt = setup.humanloopClient.prompt({
+        path: prompt.path,
+        callable: myPromptBase,
+    });
+
+    // Call the decorated function
+    const result = await myPrompt(input);
+    if (result) {
+        expect(result.toLowerCase()).toContain(expectedSubstring.toLowerCase());
+    } else {
+        throw new Error("Expected result to be defined");
+    }
+
+    // Wait for 5 seconds for the log to be created
+    await new Promise((resolve) => setTimeout(resolve, 5000));
+}
+
+describe("decorators", () => {
+    it("should create a prompt log when using the decorator", async () => {
+        let testSetup: TestSetup | undefined = undefined;
+        let testPrompt: TestPrompt | undefined = undefined;
+
+        try {
+            testSetup = await setupTestEnvironment("test_prompt_call_decorator");
+            // Create test prompt
+            testPrompt = await createTestPrompt(testSetup);
+
+            // Check initial version count
+            const promptVersionsResponse =
+                await testSetup.humanloopClient.prompts.listVersions(testPrompt.id);
+            expect(promptVersionsResponse.records.length).toBe(1);
+
+            // Test the prompt decorator
+            await testPromptDecorator(testSetup, testPrompt);
+
+            // Verify a new version was created
+            const updatedPromptVersionsResponse =
+                await testSetup.humanloopClient.prompts.listVersions(testPrompt.id);
+            expect(updatedPromptVersionsResponse.records.length).toBe(2);
+
+            // Verify logs were created
+            const logsResponse = await testSetup.humanloopClient.logs.list({
+                fileId: testPrompt.id,
+                page: 1,
+                size: 50,
+            });
+            expect(logsResponse.data.length).toBe(1);
+        } catch (error) {
+            // Make sure to clean up if the test fails
+            const cleanupResources: CleanupResources[] = [];
+            if (testPrompt) {
+                cleanupResources.push({
+                    type: "prompt",
+                    id: testPrompt.id,
+                });
+            }
+            if (testSetup) {
+                await cleanupTestEnvironment(testSetup, cleanupResources);
+            }
+            throw error;
+        }
+    });
+
+    it("should create logs with proper tracing when using prompt in flow decorator", async () => {
+        let testSetup: TestSetup | undefined = undefined;
+        let flowId: string | null = null;
+        let promptId: string | null = null;
+
+        try {
+            // Create test flow and prompt paths
+            testSetup = await setupTestEnvironment("test_flow_decorator");
+            const flowPath = `${testSetup.sdkTestDir.path}/test_flow`;
+            const promptPath = `${testSetup.sdkTestDir.path}/test_prompt`;
+
+            // Create the prompt
+            const promptResponse = await testSetup.humanloopClient.prompts.upsert({
+                path: promptPath,
+                provider: "openai",
+                model: "gpt-4o-mini",
+                temperature: 0,
+            });
+            const promptId = promptResponse.id;
+
+            // Define the flow callable function with the correct type signature
+            const flowCallable = async (question: {
+                question: string;
+            }): Promise<string> => {
+                const response = await testSetup!.humanloopClient.prompts.call({
+                    path: promptPath,
+                    messages: [{ role: "user", content: question.question }],
+                    providerApiKeys: { openai: testSetup!.openaiApiKey },
+                });
+
+                const output = response.logs?.[0]?.output;
+                expect(output).not.toBeNull();
+                return output || "";
+            };
+
+            // Apply the flow decorator
+            const myFlow = testSetup.humanloopClient.flow({
+                path: flowPath,
+                callable: flowCallable,
+            });
+
+            // Call the flow with the expected input format
+            const result = await myFlow({
+                question: "What is the capital of the France?",
+            });
+            expect(result?.toLowerCase()).toContain("paris");
+
+            // Wait for logs to be created
+            await new Promise((resolve) => setTimeout(resolve, 5000));
+
+            // Verify prompt logs
+            const promptRetrieveResponse =
+                await testSetup.humanloopClient.files.retrieveByPath({
+                    path: promptPath,
+                });
+            expect(promptRetrieveResponse).not.toBeNull();
+            const promptLogsResponse = await testSetup.humanloopClient.logs.list({
+                fileId: promptRetrieveResponse.id,
+                page: 1,
+                size: 50,
+            });
+            expect(promptLogsResponse.data.length).toBe(1);
+            const promptLog = promptLogsResponse.data[0];
+
+            // Verify flow logs
+            const flowRetrieveResponse =
+                await testSetup.humanloopClient.files.retrieveByPath({
+                    path: flowPath,
+                });
+            expect(flowRetrieveResponse).not.toBeNull();
+            flowId = flowRetrieveResponse.id;
+            const flowLogsResponse = await testSetup.humanloopClient.logs.list({
+                fileId: flowRetrieveResponse.id,
+                page: 1,
+                size: 50,
+            });
+            expect(flowLogsResponse.data.length).toBe(1);
+            const flowLog = flowLogsResponse.data[0];
+
+            // Verify tracing between logs
+            expect(promptLog.traceParentId).toBe(flowLog.id);
+        } finally {
+            // Clean up resources
+            const cleanupResources: CleanupResources[] = [];
+            if (flowId) {
+                cleanupResources.push({
+                    type: "flow",
+                    id: flowId,
+                });
+            }
+            if (promptId) {
+                cleanupResources.push({
+                    type: "prompt",
+                    id: promptId,
+                });
+            }
+            if (testSetup) {
+                await cleanupTestEnvironment(testSetup, cleanupResources);
+            }
+        }
+    });
+
+    it("should log exceptions when using the flow decorator", async () => {
+        let testSetup: TestSetup | undefined = undefined;
+        let flowId: string | null = null;
+
+        try {
+            // Create test flow path
+            testSetup = await setupTestEnvironment("test_flow_decorator");
+            const flowPath = `${testSetup.sdkTestDir.path}/test_flow_log_error`;
+
+            // Define a flow callable that throws an error
+            const flowCallable = async ({
+                question,
+            }: {
+                question: string;
+            }): Promise<string> => {
+                throw new Error("This is a test exception");
+            };
+
+            // Apply the flow decorator
+            const myFlow = testSetup.humanloopClient.flow({
+                path: flowPath,
+                callable: flowCallable,
+            });
+
+            // Call the flow and expect it to throw
+            try {
+                await myFlow({ question: "test" });
+                // If we get here, the test should fail
+                throw new Error("Expected flow to throw an error but it didn't");
+            } catch (error) {
+                // Expected error
+                expect(error).toBeDefined();
+            }
+
+            // Wait for logs to be created
+            await new Promise((resolve) => setTimeout(resolve, 5000));
+
+            // Verify flow logs
+            const flowRetrieveResponse =
+                await testSetup.humanloopClient.files.retrieveByPath({
+                    path: flowPath,
+                });
+            expect(flowRetrieveResponse).not.toBeNull();
+            flowId = flowRetrieveResponse.id;
+
+            const flowLogsResponse = await testSetup.humanloopClient.logs.list({
+                fileId: flowRetrieveResponse.id,
+                page: 1,
+                size: 50,
+            });
+            expect(flowLogsResponse.data.length).toBe(1);
+
+            const flowLog = flowLogsResponse.data[0];
+            expect(flowLog.error).not.toBeUndefined();
+            expect(flowLog.output).toBeUndefined();
+        } finally {
+            if (testSetup) {
+                await cleanupTestEnvironment(
+                    testSetup,
+                    flowId
+                        ? [
+                              {
+                                  type: "flow",
+                                  id: flowId,
+                              },
+                          ]
+                        : [],
+                );
+            }
+        }
+    });
+
+    it("should populate outputMessage when flow returns chat message format", async () => {
+        let testSetup: TestSetup | undefined = undefined;
+        let flowId: string | null = null;
+
+        try {
+            // Create test flow path
+            testSetup = await setupTestEnvironment("test_flow_decorator");
+            const flowPath = `${testSetup.sdkTestDir.path}/test_flow_log_output_message`;
+
+            // Define a flow callable that returns a chat message format
+            const flowCallable = async ({ question }: { question: string }) => {
+                return {
+                    role: "user",
+                    content: question,
+                };
+            };
+
+            // Apply the flow decorator
+            const myFlow = testSetup.humanloopClient.flow({
+                path: flowPath,
+                callable: flowCallable,
+            });
+
+            // Call the flow and check the returned message
+            const result = await myFlow({
+                question: "What is the capital of the France?",
+            });
+            expect(result?.content.toLowerCase()).toContain("france");
+
+            // Wait for logs to be created
+            await new Promise((resolve) => setTimeout(resolve, 5000));
+
+            // Verify flow logs
+            const flowRetrieveResponse =
+                await testSetup.humanloopClient.files.retrieveByPath({
+                    path: flowPath,
+                });
+            expect(flowRetrieveResponse).not.toBeNull();
+            flowId = flowRetrieveResponse.id;
+
+            const flowLogsResponse = await testSetup.humanloopClient.logs.list({
+                fileId: flowRetrieveResponse.id,
+                page: 1,
+                size: 50,
+            });
+            expect(flowLogsResponse.data.length).toBe(1);
+
+            const flowLog = flowLogsResponse.data[0];
+            expect(flowLog.outputMessage).not.toBeUndefined();
+            expect(flowLog.output).toBeUndefined();
+            expect(flowLog.error).toBeUndefined();
+        } finally {
+            // Clean up resources
+            if (flowId) {
+                await testSetup!.humanloopClient.flows.delete(flowId);
+            }
+            if (testSetup) {
+                await cleanupTestEnvironment(
+                    testSetup,
+                    flowId
+                        ? [
+                              {
+                                  type: "flow",
+                                  id: flowId,
+                              },
+                          ]
+                        : [],
+                );
+            }
+        }
+    });
+
+    it("should run evaluations on a flow decorator", async () => {
+        let testSetup: TestSetup | undefined = undefined;
+        let flowId: string | null = null;
+
+        try {
+            // Use fixtures from testSetup
+            testSetup = await setupTestEnvironment("eval-flow-decorator");
+            if (!testSetup.evalDataset || !testSetup.outputNotNullEvaluator) {
+                throw new Error("Required fixtures are not initialized");
+            }
+
+            // Create test flow path
+            const flowPath = `${testSetup.sdkTestDir.path}/test_flow_evaluate`;
+
+            // Define flow decorated function
+            const myFlow = testSetup.humanloopClient.flow({
+                path: flowPath,
+                callable: async (inputs: { question: string }) => {
+                    return "paris";
+                },
+            });
+
+            // Run evaluation on the flow
+            await testSetup.humanloopClient.evaluations.run({
+                name: "Evaluate Flow Decorator",
+                file: {
+                    path: flowPath,
+                    callable: myFlow,
+                    type: "flow",
+                },
+                dataset: {
+                    path: testSetup.evalDataset.path,
+                },
+                evaluators: [
+                    {
+                        path: testSetup.outputNotNullEvaluator.path,
+                    },
+                ],
+            });
+
+            // Get the flow ID for cleanup
+            const flowResponse = await testSetup.humanloopClient.files.retrieveByPath({
+                path: flowPath,
+            });
+            flowId = flowResponse.id;
+        } finally {
+            if (testSetup) {
+                await cleanupTestEnvironment(
+                    testSetup,
+                    flowId
+                        ? [
+                              {
+                                  type: "flow",
+                                  id: flowId,
+                              },
+                          ]
+                        : [],
+                );
+            }
+        }
+    });
+
+    it("should throw error when using non-existent file ID instead of path", async () => {
+        // Use fixtures from testSetup
+        let testSetup: TestSetup | undefined = undefined;
+        try {
+            testSetup = await setupTestEnvironment("eval-flow-decorator");
+            if (!testSetup.evalDataset || !testSetup.outputNotNullEvaluator) {
+                throw new Error("Required fixtures are not initialized");
+            }
+            // Define a simple callable
+            const simpleCallable = (x: any) => x;
+
+            // Expect the evaluation to throw an error with a non-existent file ID
+            try {
+                await testSetup.humanloopClient.evaluations.run({
+                    name: "Evaluate Flow Decorator",
+                    file: {
+                        id: "non-existent-file-id",
+                        type: "flow",
+                        version: {
+                            attributes: {
+                                foo: "bar",
+                            },
+                        },
+                        callable: simpleCallable,
+                    },
+                    dataset: {
+                        path: testSetup.evalDataset.path,
+                    },
+                    evaluators: [
+                        {
+                            path: testSetup.outputNotNullEvaluator.path,
+                        },
+                    ],
+                });
+
+                // If we get here, the test should fail
+                throw new Error("Expected HumanloopRuntimeError but none was thrown");
+            } catch (error) {
+                expect(error).toBeInstanceOf(HumanloopRuntimeError);
+                expect((error as HumanloopRuntimeError).message).toContain(
+                    "File does not exist on Humanloop. Please provide a `file.path` and a version to create a new version.",
+                );
+            }
+        } finally {
+            if (testSetup) {
+                await cleanupTestEnvironment(testSetup);
+            }
+        }
+    });
+});
diff --git a/tests/custom/integration/evals.test.ts b/tests/custom/integration/evals.test.ts
new file mode 100644
index 00000000..09e3b9bf
--- /dev/null
+++ b/tests/custom/integration/evals.test.ts
@@ -0,0 +1,577 @@
+import { FlowResponse } from "../../../src/api";
+import { HumanloopRuntimeError } from "../../../src/error";
+import { HumanloopClient } from "../../../src/humanloop.client";
+import {
+    cleanupTestEnvironment,
+    readEnvironment,
+    setupTestEnvironment,
+} from "./fixtures";
+
+// process.stdout.moveCursor is undefined in jest; mocking it since STDOUT is not relevant
+if (typeof process.stdout.moveCursor !== "function") {
+    process.stdout.moveCursor = (
+        dx: number,
+        dy: number,
+        callback?: () => void,
+    ): boolean => {
+        if (callback) callback();
+        return true;
+    };
+}
+
+// Long timeout per test; evals might take a while to run
+jest.setTimeout(30 * 1000);
+
+interface TestIdentifiers {
+    id: string;
+    path: string;
+}
+
+interface TestSetup {
+    sdkTestDir: TestIdentifiers;
+    outputNotNullEvaluator: TestIdentifiers;
+    evalDataset: TestIdentifiers;
+    evalPrompt: TestIdentifiers;
+    stagingEnvironmentId: string;
+}
+
+describe("Evals", () => {
+    let humanloopClient: HumanloopClient;
+    let openaiApiKey: string;
+
+    beforeAll(async () => {
+        readEnvironment();
+        if (!process.env.HUMANLOOP_API_KEY) {
+            throw new Error("HUMANLOOP_API_KEY is not set");
+        }
+        if (!process.env.OPENAI_API_KEY) {
+            throw new Error("OPENAI_API_KEY is not set for integration tests");
+        }
+        openaiApiKey = process.env.OPENAI_API_KEY;
+        humanloopClient = new HumanloopClient({
+            apiKey: process.env.HUMANLOOP_API_KEY,
+        });
+    });
+
+    it("should be able to import HumanloopClient", async () => {
+        const client = new HumanloopClient({ apiKey: process.env.HUMANLOOP_API_KEY });
+        expect(client).toBeDefined();
+    });
+
+    it("should run evaluation on online files", async () => {
+        // Setup test-specific environment
+        const setup = await setupTestEnvironment("online_files");
+
+        try {
+            await humanloopClient.evaluations.run({
+                file: {
+                    path: setup.evalPrompt.path,
+                    type: "prompt",
+                },
+                dataset: {
+                    path: setup.evalDataset.path,
+                },
+                name: "test_eval_run",
+                evaluators: [
+                    {
+                        path: setup.outputNotNullEvaluator.path,
+                    },
+                ],
+            });
+
+            // Wait for evaluation to complete
+            await new Promise((resolve) => setTimeout(resolve, 5000));
+
+            const evalResponse = await humanloopClient.evaluations.list({
+                fileId: setup.evalPrompt.id,
+            });
+            expect(evalResponse.data.length).toBe(1);
+
+            const evaluationId = evalResponse.data[0].id;
+            const runsResponse =
+                await humanloopClient.evaluations.listRunsForEvaluation(evaluationId);
+            expect(runsResponse.runs[0].status).toBe("completed");
+        } finally {
+            // Clean up test-specific resources
+            await cleanupTestEnvironment(setup);
+        }
+    });
+
+    it("should run evaluation with version_id", async () => {
+        // Setup test-specific environment
+        const setup = await setupTestEnvironment("version_id");
+
+        try {
+            // Create a new prompt version
+            const newPromptVersionResponse = await humanloopClient.prompts.upsert({
+                path: setup.evalPrompt.path,
+                provider: "openai",
+                model: "gpt-4o-mini",
+                temperature: 0,
+                template: [
+                    {
+                        role: "system",
+                        content:
+                            "You are a helpful assistant. You must answer the user's question truthfully and at the level of a 5th grader.",
+                    },
+                    {
+                        role: "user",
+                        content: "{{question}}",
+                    },
+                ],
+            });
+
+            // Run evaluation with version_id
+            await humanloopClient.evaluations.run({
+                file: {
+                    id: newPromptVersionResponse.id,
+                    versionId: newPromptVersionResponse.versionId,
+                    type: "prompt",
+                },
+                dataset: {
+                    path: setup.evalDataset.path,
+                },
+                name: "test_eval_run",
+                evaluators: [
+                    {
+                        path: setup.outputNotNullEvaluator.path,
+                    },
+                ],
+            });
+
+            // Verify evaluation
+            const evaluationsResponse = await humanloopClient.evaluations.list({
+                fileId: newPromptVersionResponse.id,
+            });
+            expect(evaluationsResponse.data.length).toBe(1);
+
+            const evaluationId = evaluationsResponse.data[0].id;
+            const runsResponse =
+                await humanloopClient.evaluations.listRunsForEvaluation(evaluationId);
+            expect(runsResponse.runs[0].status).toBe("completed");
+            if (runsResponse.runs[0].version) {
+                expect(runsResponse.runs[0].version.versionId).toBe(
+                    newPromptVersionResponse.versionId,
+                );
+            }
+
+            // Verify version is not the default
+            const response = await humanloopClient.prompts.get(
+                newPromptVersionResponse.id,
+            );
+            expect(response.versionId).not.toBe(newPromptVersionResponse.versionId);
+        } finally {
+            // Clean up test-specific resources
+            await cleanupTestEnvironment(setup);
+        }
+    });
+
+    it("should run evaluation with environment", async () => {
+        // Setup test-specific environment
+        const setup = await setupTestEnvironment("environment");
+
+        try {
+            // Create a new prompt version and deploy to staging
+            const newPromptVersionResponse = await humanloopClient.prompts.upsert({
+                path: setup.evalPrompt.path,
+                provider: "openai",
+                model: "gpt-4o-mini",
+                temperature: 0,
+                template: [
+                    {
+                        role: "system",
+                        content:
+                            "You are a helpful assistant. You must answer the user's question truthfully and at the level of a 5th grader.",
+                    },
+                    {
+                        role: "user",
+                        content: "{{question}}",
+                    },
+                ],
+            });
+
+            await humanloopClient.prompts.setDeployment(
+                newPromptVersionResponse.id,
+                setup.stagingEnvironmentId,
+                {
+                    versionId: newPromptVersionResponse.versionId,
+                },
+            );
+
+            // Run evaluation with environment
+            await humanloopClient.evaluations.run({
+                file: {
+                    id: newPromptVersionResponse.id,
+                    type: "prompt",
+                    environment: "staging",
+                },
+                dataset: {
+                    path: setup.evalDataset.path,
+                },
+                name: "test_eval_run",
+                evaluators: [
+                    {
+                        path: setup.outputNotNullEvaluator.path,
+                    },
+                ],
+            });
+
+            // Verify evaluation
+            const evaluationsResponse = await humanloopClient.evaluations.list({
+                fileId: newPromptVersionResponse.id,
+            });
+            expect(evaluationsResponse.data.length).toBe(1);
+
+            const evaluationId = evaluationsResponse.data[0].id;
+            const runsResponse =
+                await humanloopClient.evaluations.listRunsForEvaluation(evaluationId);
+            expect(runsResponse.runs[0].status).toBe("completed");
+            if (runsResponse.runs[0].version) {
+                expect(runsResponse.runs[0].version.versionId).toBe(
+                    newPromptVersionResponse.versionId,
+                );
+            }
+
+            const defaultPromptVersionResponse = await humanloopClient.prompts.get(
+                newPromptVersionResponse.id,
+            );
+            expect(defaultPromptVersionResponse.versionId).not.toBe(
+                newPromptVersionResponse.versionId,
+            );
+        } finally {
+            // Clean up test-specific resources
+            await cleanupTestEnvironment(setup);
+        }
+    });
+
+    it("should fail when using version_id with path", async () => {
+        // Setup test-specific environment
+        const setup = await setupTestEnvironment("fail_with_version_id");
+
+        try {
+            try {
+                await humanloopClient.evaluations.run({
+                    file: {
+                        path: setup.evalPrompt.path,
+                        type: "prompt",
+                        versionId: "will_not_work",
+                    },
+                    dataset: {
+                        path: setup.evalDataset.path,
+                    },
+                    name: "test_eval_run",
+                    evaluators: [
+                        {
+                            path: setup.outputNotNullEvaluator.path,
+                        },
+                    ],
+                });
+                // If we got here, the test failed
+                throw new Error("Expected runtime error but none was thrown");
+            } catch (error: any) {
+                if (error instanceof HumanloopRuntimeError) {
+                    expect(error.message).toContain(
+                        "You must provide the `file.id` when addressing a file by version ID or environment",
+                    );
+                } else {
+                    throw new Error(
+                        `Expected test to fail for version_id but got ${error}`,
+                    );
+                }
+            }
+        } finally {
+            // Clean up test-specific resources
+            await cleanupTestEnvironment(setup);
+        }
+    });
+
+    it("should fail when using environment with path", async () => {
+        // Setup test-specific environment
+        const setup = await setupTestEnvironment("fail_with_environment");
+
+        try {
+            await humanloopClient.evaluations.run({
+                file: {
+                    path: setup.evalPrompt.path,
+                    type: "prompt",
+                    environment: "staging",
+                },
+                dataset: {
+                    path: setup.evalDataset.path,
+                },
+                name: "test_eval_run",
+                evaluators: [
+                    {
+                        path: setup.outputNotNullEvaluator.path,
+                    },
+                ],
+            });
+            // If we got here, the test failed
+            throw new Error("Expected runtime error but none was thrown");
+        } catch (error: any) {
+            if (error instanceof HumanloopRuntimeError) {
+                expect(error.message).toContain(
+                    "You must provide the `file.id` when addressing a file by version ID or environment",
+                );
+            } else {
+                throw new Error(
+                    `Expected test to fail for environment but got ${error}`,
+                );
+            }
+        } finally {
+            // Clean up test-specific resources
+            await cleanupTestEnvironment(setup);
+        }
+    });
+
+    it("should run evaluation with version upsert", async () => {
+        // Setup test-specific environment
+        const setup = await setupTestEnvironment("version_upsert");
+
+        try {
+            await humanloopClient.evaluations.run({
+                file: {
+                    path: setup.evalPrompt.path,
+                    type: "prompt",
+                    version: {
+                        provider: "openai",
+                        model: "gpt-4o-mini",
+                        temperature: 1,
+                        template: [
+                            {
+                                role: "system",
+                                content:
+                                    "You are a helpful assistant. You must answer the user's question truthfully and at the level of a 5th grader.",
+                            },
+                            {
+                                role: "user",
+                                content: "{{question}}",
+                            },
+                        ],
+                    },
+                },
+                dataset: {
+                    path: setup.evalDataset.path,
+                },
+                name: "test_eval_run",
+                evaluators: [
+                    {
+                        path: setup.outputNotNullEvaluator.path,
+                    },
+                ],
+            });
+
+            // Verify evaluation
+            const evaluationsResponse = await humanloopClient.evaluations.list({
+                fileId: setup.evalPrompt.id,
+            });
+            expect(evaluationsResponse.data.length).toBe(1);
+
+            const evaluationId = evaluationsResponse.data[0].id;
+            const runsResponse =
+                await humanloopClient.evaluations.listRunsForEvaluation(evaluationId);
+            expect(runsResponse.runs[0].status).toBe("completed");
+
+            // Verify version upsert
+            const listPromptVersionsResponse =
+                await humanloopClient.prompts.listVersions(setup.evalPrompt.id);
+            expect(listPromptVersionsResponse.records.length).toBe(2);
+        } finally {
+            // Clean up test-specific resources
+            await cleanupTestEnvironment(setup);
+        }
+    });
+
+    it("should fail flow eval without callable", async () => {
+        // Setup test-specific environment
+        const setup = await setupTestEnvironment("flow_fail_without_callable");
+
+        try {
+            try {
+                await humanloopClient.evaluations.run({
+                    file: {
+                        path: "Test Flow",
+                        type: "flow",
+                        version: {
+                            attributes: {
+                                foo: "bar",
+                            },
+                        },
+                    },
+                    dataset: {
+                        path: setup.evalDataset.path,
+                    },
+                    name: "test_eval_run",
+                    evaluators: [
+                        {
+                            path: setup.outputNotNullEvaluator.path,
+                        },
+                    ],
+                });
+                // If we got here, the test failed
+                fail("Expected runtime error but none was thrown");
+            } catch (error: any) {
+                expect(error.message).toContain(
+                    "You must provide a `callable` for your Flow `file` to run a local eval.",
+                );
+            }
+        } finally {
+            // Clean up test-specific resources
+            await cleanupTestEnvironment(setup);
+        }
+    });
+
+    it("should run flow eval with callable", async () => {
+        // Setup test-specific environment
+        const setup = await setupTestEnvironment("flow_with_callable");
+
+        try {
+            const flowPath = `${setup.sdkTestDir.path}/Test Flow`;
+
+            // Create flow
+            const flowResponse = await humanloopClient.flows.upsert({
+                path: flowPath,
+                attributes: {
+                    foo: "bar",
+                },
+            });
+
+            try {
+                const flow = await humanloopClient.flows.upsert({
+                    path: flowPath,
+                    attributes: {
+                        foo: "bar",
+                    },
+                });
+
+                // Run evaluation with flow
+                await humanloopClient.evaluations.run({
+                    file: {
+                        id: flow.id,
+                        type: "flow",
+                        callable: ({ question }) =>
+                            "It's complicated don't worry about it",
+                        version: {
+                            attributes: {
+                                foo: "bar",
+                            },
+                        },
+                    },
+                    dataset: {
+                        path: setup.evalDataset.path,
+                    },
+                    name: "test_eval_run",
+                    evaluators: [
+                        {
+                            path: setup.outputNotNullEvaluator.path,
+                        },
+                    ],
+                });
+
+                // Verify evaluation
+                const evaluationsResponse = await humanloopClient.evaluations.list({
+                    fileId: flow.id,
+                });
+                expect(evaluationsResponse.data.length).toBe(1);
+
+                const evaluationId = evaluationsResponse.data[0].id;
+                const runsResponse =
+                    await humanloopClient.evaluations.listRunsForEvaluation(
+                        evaluationId,
+                    );
+                expect(runsResponse.runs[0].status).toBe("completed");
+            } finally {
+                await humanloopClient.flows.delete(flowResponse.id);
+            }
+        } finally {
+            // Clean up test-specific resources
+            await cleanupTestEnvironment(setup);
+        }
+    });
+
+    it("should not allow evaluating agent with callable", async () => {
+        // Setup test-specific environment
+        const setup = await setupTestEnvironment("agent_with_callable");
+
+        try {
+            try {
+                await humanloopClient.evaluations.run({
+                    file: {
+                        path: "Test Agent",
+                        type: "agent",
+                        callable: (inputs: any) => "bar",
+                    },
+                    dataset: {
+                        path: setup.evalDataset.path,
+                    },
+                    name: "test_eval_run",
+                    evaluators: [
+                        {
+                            path: setup.outputNotNullEvaluator.path,
+                        },
+                    ],
+                });
+                // If we got here, the test failed
+                fail("Expected ValueError but none was thrown");
+            } catch (error: any) {
+                expect(error.message).toBe(
+                    "Agent evaluation is only possible on the Humanloop runtime, do not provide a `callable`.",
+                );
+            }
+        } finally {
+            // Clean up test-specific resources
+            await cleanupTestEnvironment(setup);
+        }
+    });
+
+    it("should resolve to default flow version when callable is provided without version", async () => {
+        // Setup test-specific environment
+        const setup = await setupTestEnvironment("flow_with_callable_without_version");
+        let flowResponse: FlowResponse;
+        try {
+            const flowPath = `${setup.sdkTestDir.path}/Test Flow`;
+
+            // Create flow
+            flowResponse = await humanloopClient.flows.upsert({
+                path: flowPath,
+                attributes: {
+                    foo: "bar",
+                },
+            });
+
+            // Run evaluation with flow
+            await humanloopClient.evaluations.run({
+                file: {
+                    id: flowResponse.id,
+                    type: "flow",
+                    callable: ({ question }) => "It's complicated don't worry about it",
+                },
+                dataset: {
+                    path: setup.evalDataset.path,
+                },
+                name: "test_eval_run",
+                evaluators: [
+                    {
+                        path: setup.outputNotNullEvaluator.path,
+                    },
+                ],
+            });
+
+            // Verify evaluation
+            const evaluationsResponse = await humanloopClient.evaluations.list({
+                fileId: flowResponse.id,
+            });
+            expect(evaluationsResponse.data.length).toBe(1);
+
+            const evaluationId = evaluationsResponse.data[0].id;
+            const runsResponse =
+                await humanloopClient.evaluations.listRunsForEvaluation(evaluationId);
+            expect(runsResponse.runs[0].status).toBe("completed");
+        } finally {
+            // Clean up test-specific resources
+            await cleanupTestEnvironment(setup, [
+                { id: flowResponse!.id, type: "flow" },
+            ]);
+        }
+    });
+});
diff --git a/tests/custom/integration/fixtures.ts b/tests/custom/integration/fixtures.ts
new file mode 100644
index 00000000..c7ba73b9
--- /dev/null
+++ b/tests/custom/integration/fixtures.ts
@@ -0,0 +1,345 @@
+import dotenv from "dotenv";
+import { OpenAI } from "openai";
+import { v4 as uuidv4 } from "uuid";
+
+import { FileType, PromptRequest, PromptResponse } from "../../../src/api";
+import { HumanloopClient } from "../../../src/humanloop.client";
+
+export interface ResourceIdentifiers {
+    id: string;
+    path: string;
+}
+
+export interface TestPrompt {
+    id: string;
+    path: string;
+    response: PromptResponse;
+}
+
+export interface SyncableFile {
+    path: string;
+    type: "prompt" | "agent";
+    model: string;
+    id?: string;
+    versionId?: string;
+}
+
+export interface TestSetup {
+    sdkTestDir: ResourceIdentifiers;
+    testPromptConfig: PromptRequest;
+    openaiApiKey: string;
+    humanloopClient: HumanloopClient;
+    evalDataset: ResourceIdentifiers;
+    evalPrompt: ResourceIdentifiers;
+    stagingEnvironmentId: string;
+    outputNotNullEvaluator: ResourceIdentifiers;
+}
+
+export interface CleanupResources {
+    type: FileType;
+    id: string;
+}
+
+export function readEnvironment(): void {
+    if (![process.env.HUMANLOOP_API_KEY, process.env.OPENAI_API_KEY].every(Boolean)) {
+        // Testing locally not in CI, running dotenv.config() would override the secrets set for GitHub Action
+        dotenv.config({});
+    }
+    if (!process.env.HUMANLOOP_API_KEY) {
+        throw new Error("HUMANLOOP_API_KEY is not set");
+    }
+    if (!process.env.OPENAI_API_KEY) {
+        throw new Error("OPENAI_API_KEY is not set for integration tests");
+    }
+}
+
+export function getSubclient(client: HumanloopClient, type: FileType) {
+    switch (type) {
+        case "prompt":
+            return client.prompts;
+        case "tool":
+            return client.tools;
+        case "flow":
+            return client.flows;
+        case "agent":
+            return client.agents;
+        case "dataset":
+            return client.datasets;
+        case "evaluator":
+            return client.evaluators;
+        default:
+            throw new Error(`Unsupported file type: ${type}`);
+    }
+}
+
+export async function setupTestEnvironment(testName: string): Promise<TestSetup> {
+    readEnvironment();
+
+    const openaiApiKey = process.env.OPENAI_API_KEY!;
+    const humanloopClient = new HumanloopClient({
+        apiKey: process.env.HUMANLOOP_API_KEY,
+        instrumentProviders: {
+            OpenAI: OpenAI,
+        },
+    });
+
+    // Create a test directory
+    const directoryPath = `SDK_TEST_${testName}_${uuidv4()}`;
+    const response = await humanloopClient.directories.create({
+        path: directoryPath,
+    });
+
+    const sdkTestDir = {
+        id: response.id,
+        path: response.path,
+    };
+
+    // Create test prompt config
+    const testPromptConfig: PromptRequest = {
+        provider: "openai",
+        model: "gpt-4o-mini",
+        temperature: 0.5,
+        template: [
+            {
+                role: "system",
+                content: "You are a helpful assistant. Answer concisely.",
+            },
+            {
+                role: "user",
+                content: "{{question}}",
+            },
+        ],
+    };
+
+    // Create evaluator for testing
+    const evaluatorPath = `${sdkTestDir.path}/output_not_null_evaluator`;
+    const evaluatorResponse = await humanloopClient.evaluators.upsert({
+        path: evaluatorPath,
+        spec: {
+            argumentsType: "target_required",
+            returnType: "boolean",
+            code: `
+def output_not_null(log: dict) -> bool:
+    return log["output"] is not None
+            `,
+            evaluatorType: "python",
+        },
+    });
+    const outputNotNullEvaluator = {
+        id: evaluatorResponse.id,
+        path: evaluatorPath,
+    };
+
+    // Create dataset for testing
+    const datasetPath = `${sdkTestDir.path}/eval_dataset`;
+    const datasetResponse = await humanloopClient.datasets.upsert({
+        path: datasetPath,
+        datapoints: [
+            {
+                inputs: { question: "What is the capital of the France?" },
+                target: { output: "Paris" },
+            },
+            {
+                inputs: { question: "What is the capital of the Germany?" },
+                target: { output: "Berlin" },
+            },
+            {
+                inputs: { question: "What is 2+2?" },
+                target: { output: "4" },
+            },
+        ],
+    });
+    const evalDataset = {
+        id: datasetResponse.id,
+        path: datasetResponse.path,
+    };
+
+    // Create prompt
+    const promptPath = `${sdkTestDir.path}/eval_prompt`;
+    const promptResponse = await humanloopClient.prompts.upsert({
+        path: promptPath,
+        ...(testPromptConfig as PromptRequest),
+    });
+    const evalPrompt = {
+        id: promptResponse.id,
+        path: promptResponse.path,
+    };
+
+    // Get staging environment ID
+    const environmentsResponse = await humanloopClient.prompts.listEnvironments(
+        evalPrompt.id,
+    );
+    let stagingEnvironmentId = "";
+    for (const environment of environmentsResponse) {
+        if (environment.name === "staging") {
+            stagingEnvironmentId = environment.id;
+            break;
+        }
+    }
+    if (!stagingEnvironmentId) {
+        throw new Error("Staging environment not found");
+    }
+
+    return {
+        testPromptConfig,
+        openaiApiKey,
+        humanloopClient,
+        sdkTestDir,
+        outputNotNullEvaluator,
+        evalDataset,
+        evalPrompt,
+        stagingEnvironmentId,
+    };
+}
+
+/**
+ * Cleans up all test resources
+ * @param setup The test setup containing the resources
+ * @param resources Additional resources to clean up
+ */
+export async function cleanupTestEnvironment(
+    setup: TestSetup,
+    resources?: CleanupResources[],
+): Promise<void> {
+    try {
+        // First clean up any additional resources
+        if (resources) {
+            for (const resource of resources) {
+                try {
+                    const subclient = getSubclient(
+                        setup.humanloopClient,
+                        resource.type,
+                    );
+                    if (resource.id) {
+                        await subclient.delete(resource.id);
+                    }
+                } catch (error) {
+                    console.warn(
+                        `Failed to delete ${resource.type} ${resource.id}:`,
+                        error,
+                    );
+                }
+            }
+        }
+
+        // Sleep a bit to let API operations settle
+        await new Promise((resolve) => setTimeout(resolve, 3000));
+
+        // Recursively clean up the test directory
+        try {
+            if (setup.sdkTestDir.id) {
+                await cleanupDirectory(setup.humanloopClient, setup.sdkTestDir.id);
+            }
+        } catch (error) {
+            console.warn(`Failed to clean up test directory: ${error}`);
+        }
+    } catch (error) {
+        console.error("Error during cleanup:", error);
+    }
+}
+
+/**
+ * Recursively cleans up a directory and all its contents
+ * Mirrors the Python SDK's cleanup_directory function
+ * @param client The Humanloop client
+ * @param directoryId ID of the directory to clean
+ */
+async function cleanupDirectory(
+    client: HumanloopClient,
+    directoryId: string,
+): Promise<void> {
+    try {
+        // Get directory details
+        const directory = await client.directories.get(directoryId);
+
+        // First, recursively clean up subdirectories
+        for (const subdirectory of directory.subdirectories) {
+            await cleanupDirectory(client, subdirectory.id);
+        }
+
+        // Then delete all files in this directory
+        for (const file of directory.files) {
+            try {
+                const subclient = getSubclient(client, file.type as FileType);
+                await subclient.delete(file.id);
+            } catch (error) {
+                console.warn(`Failed to delete ${file.type} ${file.id}: ${error}`);
+            }
+        }
+
+        // Finally delete this directory
+        await client.directories.delete(directoryId);
+    } catch (error) {
+        console.warn(`Error cleaning directory ${directoryId}: ${error}`);
+    }
+}
+
+/**
+ * Creates a predefined structure of files in Humanloop for testing sync
+ */
+export async function createSyncableFilesFixture(
+    testSetup: TestSetup,
+): Promise<SyncableFile[]> {
+    const fileDefinitions: SyncableFile[] = [
+        {
+            path: "prompts/gpt-4",
+            type: "prompt",
+            model: "gpt-4o-mini",
+        },
+        {
+            path: "prompts/gpt-4o",
+            type: "prompt",
+            model: "gpt-4o-mini",
+        },
+        {
+            path: "prompts/nested/complex/gpt-4o",
+            type: "prompt",
+            model: "gpt-4o-mini",
+        },
+        {
+            path: "agents/gpt-4",
+            type: "agent",
+            model: "gpt-4o-mini",
+        },
+        {
+            path: "agents/gpt-4o",
+            type: "agent",
+            model: "gpt-4o-mini",
+        },
+    ];
+
+    const createdFiles: SyncableFile[] = [];
+
+    for (const file of fileDefinitions) {
+        const fullPath = `${testSetup.sdkTestDir.path}/${file.path}`;
+        let response;
+
+        try {
+            if (file.type === "prompt") {
+                response = await testSetup.humanloopClient.prompts.upsert({
+                    path: fullPath,
+                    model: file.model,
+                });
+            } else if (file.type === "agent") {
+                response = await testSetup.humanloopClient.agents.upsert({
+                    path: fullPath,
+                    model: file.model,
+                });
+            }
+
+            if (response) {
+                createdFiles.push({
+                    path: fullPath,
+                    type: file.type,
+                    model: file.model,
+                    id: response.id,
+                    versionId: response.versionId,
+                });
+            }
+        } catch (error) {
+            console.warn(`Failed to create ${file.type} at ${fullPath}: ${error}`);
+        }
+    }
+
+    return createdFiles;
+}
diff --git a/tests/custom/integration/localFileOperations.test.ts b/tests/custom/integration/localFileOperations.test.ts
new file mode 100644
index 00000000..4f5da986
--- /dev/null
+++ b/tests/custom/integration/localFileOperations.test.ts
@@ -0,0 +1,404 @@
+import * as fs from "fs";
+import * as path from "path";
+
+import { ChatMessage } from "../../../src/api";
+import { HumanloopRuntimeError } from "../../../src/error";
+import { HumanloopClient } from "../../../src/humanloop.client";
+import { createTempDir } from "../fixtures";
+import {
+    TestSetup,
+    cleanupTestEnvironment,
+    createSyncableFilesFixture,
+    setupTestEnvironment,
+} from "./fixtures";
+
+// Define SyncableFile interface to match Python version
+interface SyncableFile {
+    path: string;
+    type: "prompt" | "agent";
+    model: string;
+    id?: string;
+    versionId?: string;
+}
+
+interface PathTestCase {
+    name: string;
+    pathGenerator: (file: SyncableFile) => string;
+    shouldPass: boolean;
+    expectedError?: string; // Only required when shouldPass is false
+}
+
+describe("Local File Operations Integration Tests", () => {
+    let testSetup: TestSetup;
+    let syncableFiles: SyncableFile[] = [];
+    let tempDirInfo: { tempDir: string; cleanup: () => void };
+
+    beforeAll(async () => {
+        // Increase timeout for setup operations
+        jest.setTimeout(30000); // 30 seconds
+
+        // Set up test environment
+        testSetup = await setupTestEnvironment("local_file_ops");
+        tempDirInfo = createTempDir("local-file-integration");
+
+        // Create test files in Humanloop for syncing
+        syncableFiles = await createSyncableFilesFixture(testSetup);
+
+        // Pull files for tests that need them pre-pulled
+        const setupClient = new HumanloopClient({
+            apiKey: process.env.HUMANLOOP_API_KEY,
+            localFilesDirectory: tempDirInfo.tempDir,
+            useLocalFiles: true,
+        });
+
+        await setupClient.pull();
+    }, 30000);
+
+    afterAll(async () => {
+        // Clean up resources
+        tempDirInfo.cleanup();
+        await cleanupTestEnvironment(
+            testSetup,
+            syncableFiles.map((file) => ({
+                type: file.type as any,
+                id: file.id as string,
+            })),
+        );
+    }, 30000);
+
+    describe("Path Validation", () => {
+        // Path validation test cases
+        const pathTestCases = [
+            // Basic path test cases
+            {
+                name: "With whitespace",
+                pathGenerator: (file: SyncableFile) => ` ${file.path} `,
+                shouldPass: true,
+            },
+            {
+                name: "Standard extension",
+                pathGenerator: (file: SyncableFile) => `${file.path}.${file.type}`,
+                expectedError: "should not include any file extension",
+            },
+            {
+                name: "Uppercase extension",
+                pathGenerator: (file: SyncableFile) =>
+                    `${file.path}.${file.type.toUpperCase()}`,
+                expectedError: "should not include any file extension",
+            },
+            {
+                name: "Mixed case extension",
+                pathGenerator: (file: SyncableFile) =>
+                    `${file.path}.${file.type.charAt(0).toUpperCase() + file.type.slice(1)}`,
+                expectedError: "should not include any file extension",
+            },
+            // Slash path test cases
+            {
+                name: "Trailing slash",
+                pathGenerator: (file: SyncableFile) => `${file.path}/`,
+                expectedError: "Path .* format is invalid",
+            },
+            {
+                name: "Leading slash",
+                pathGenerator: (file: SyncableFile) => `/${file.path}`,
+                expectedError: "Path .* format is invalid",
+            },
+            {
+                name: "Both leading and trailing slashes",
+                pathGenerator: (file: SyncableFile) => `/${file.path}/`,
+                expectedError: "Path .* format is invalid",
+            },
+            {
+                name: "Multiple leading and trailing slashes",
+                pathGenerator: (file: SyncableFile) => `//${file.path}//`,
+                expectedError: "Path .* format is invalid",
+            },
+            // Combined path test cases
+            {
+                name: "Extension and trailing slash",
+                pathGenerator: (file: SyncableFile) => `${file.path}.${file.type}/`,
+                expectedError: "Path .* format is invalid",
+            },
+            {
+                name: "Extension and leading slash",
+                pathGenerator: (file: SyncableFile) => `/${file.path}.${file.type}`,
+                expectedError: "Path .* format is invalid",
+            },
+        ];
+
+        // Test all path validation cases
+        test.each(pathTestCases)(
+            "should $shouldPass ? 'accept' : 'reject' $name path format",
+            async ({ pathGenerator, expectedError, shouldPass }) => {
+                // GIVEN a client with local files enabled and a test file
+                const client = new HumanloopClient({
+                    apiKey: process.env.HUMANLOOP_API_KEY,
+                    localFilesDirectory: tempDirInfo.tempDir,
+                    useLocalFiles: true,
+                });
+
+                const testFile = syncableFiles[0];
+                const testPath = pathGenerator(testFile);
+                const testMessage: ChatMessage[] = [
+                    { role: "user", content: "Testing" },
+                ];
+
+                // WHEN using the path
+                if (shouldPass) {
+                    // THEN it should work (just trimming whitespace)
+                    if (testFile.type === "prompt") {
+                        await expect(
+                            client.prompts.call({
+                                path: testPath,
+                                messages: testMessage,
+                            }),
+                        ).resolves.toBeDefined();
+                    } else if (testFile.type === "agent") {
+                        await expect(
+                            client.agents.call({
+                                path: testPath,
+                                messages: testMessage,
+                            }),
+                        ).resolves.toBeDefined();
+                    }
+                } else {
+                    // Type guard to ensure expectedError is defined when shouldPass is false
+                    if (!expectedError) {
+                        throw new Error(
+                            "expectedError must be defined when shouldPass is false",
+                        );
+                    }
+
+                    // THEN appropriate error should be raised
+                    if (testFile.type === "prompt") {
+                        await expect(
+                            client.prompts.call({
+                                path: testPath,
+                                messages: testMessage,
+                            }),
+                        ).rejects.toThrow(new RegExp(expectedError));
+                    } else if (testFile.type === "agent") {
+                        await expect(
+                            client.agents.call({
+                                path: testPath,
+                                messages: testMessage,
+                            }),
+                        ).rejects.toThrow(new RegExp(expectedError));
+                    }
+                }
+            },
+        );
+    });
+
+    test("local_file_call: should call API with local prompt file", async () => {
+        // GIVEN a local prompt file with proper system tag
+        const promptContent = `---
+model: gpt-4o-mini
+temperature: 1.0
+max_tokens: -1
+top_p: 1.0
+presence_penalty: 0.0
+frequency_penalty: 0.0
+provider: openai
+endpoint: chat
+tools: []
+---
+
+<system>
+You are a helpful assistant that provides concise answers. When asked about capitals of countries, 
+you respond with just the capital name, lowercase, with no punctuation or additional text.
+</system>
+`;
+
+        // Create local file structure in temporary directory
+        const testPath = `${testSetup.sdkTestDir.path}/capital_prompt`;
+        const filePath = path.join(tempDirInfo.tempDir, `${testPath}.prompt`);
+        fs.mkdirSync(path.dirname(filePath), { recursive: true });
+        fs.writeFileSync(filePath, promptContent);
+
+        // GIVEN a client with local files enabled
+        const client = new HumanloopClient({
+            apiKey: process.env.HUMANLOOP_API_KEY,
+            localFilesDirectory: tempDirInfo.tempDir,
+            useLocalFiles: true,
+        });
+
+        // WHEN calling the API with the local file path (without extension)
+        const callMessages: ChatMessage[] = [
+            { role: "user", content: "What is the capital of France?" },
+        ];
+        const response = await client.prompts.call({
+            path: testPath,
+            messages: callMessages,
+        });
+
+        // THEN the response should be successful
+        expect(response).toBeDefined();
+        expect(response.logs).toBeDefined();
+        expect(response.logs?.length).toBeGreaterThan(0);
+
+        // AND the response should contain the expected output format (lowercase city name)
+        const output = response.logs?.[0].output;
+        expect(output).toBeDefined();
+        expect(output?.toLowerCase()).toContain("paris");
+
+        // AND the prompt used should match our expected path
+        expect(response.prompt).toBeDefined();
+        expect(response.prompt?.path).toBe(testPath);
+    });
+
+    test("local_file_log: should log data with local prompt file", async () => {
+        // GIVEN a local prompt file with proper system tag
+        const promptContent = `---
+model: gpt-4o-mini
+temperature: 1.0
+max_tokens: -1
+top_p: 1.0
+presence_penalty: 0.0
+frequency_penalty: 0.0
+provider: openai
+endpoint: chat
+tools: []
+---
+
+<system>
+You are a helpful assistant that answers questions about geography.
+</system>
+`;
+
+        // Create local file structure in temporary directory
+        const testPath = `${testSetup.sdkTestDir.path}/geography_prompt`;
+        const filePath = path.join(tempDirInfo.tempDir, `${testPath}.prompt`);
+        fs.mkdirSync(path.dirname(filePath), { recursive: true });
+        fs.writeFileSync(filePath, promptContent);
+
+        // GIVEN a client with local files enabled
+        const client = new HumanloopClient({
+            apiKey: process.env.HUMANLOOP_API_KEY,
+            localFilesDirectory: tempDirInfo.tempDir,
+            useLocalFiles: true,
+        });
+
+        // GIVEN message content to log
+        const testOutput = "Paris is the capital of France.";
+
+        // WHEN logging the data with the local file path
+        const messages: ChatMessage[] = [
+            { role: "user", content: "What is the capital of France?" },
+        ];
+        const response = await client.prompts.log({
+            path: testPath,
+            messages: messages,
+            output: testOutput,
+        });
+
+        // THEN the log should be successful
+        expect(response).toBeDefined();
+        expect(response.promptId).toBeDefined();
+        expect(response.id).toBeDefined(); // log ID
+
+        // WHEN retrieving the logged prompt details
+        const promptDetails = await client.prompts.get(response.promptId);
+
+        // THEN the details should match our expected path
+        expect(promptDetails).toBeDefined();
+        expect(promptDetails.path).toContain(testPath);
+    });
+
+    test("overload_version_environment_handling: should handle version_id and environment parameters", async () => {
+        // GIVEN a client with local files enabled
+        const client = new HumanloopClient({
+            apiKey: process.env.HUMANLOOP_API_KEY,
+            localFilesDirectory: tempDirInfo.tempDir,
+            useLocalFiles: true,
+        });
+
+        const testMessage: ChatMessage[] = [{ role: "user", content: "Testing" }];
+
+        // GIVEN a test file that exists locally
+        const testFile = syncableFiles[0];
+        const extension = `.${testFile.type}`;
+        const localPath = path.join(
+            tempDirInfo.tempDir,
+            `${testFile.path}${extension}`,
+        );
+
+        // THEN the file should exist locally
+        expect(fs.existsSync(localPath)).toBe(true);
+        expect(fs.existsSync(path.dirname(localPath))).toBe(true);
+
+        // WHEN calling with version_id
+        // THEN a HumanloopRuntimeError should be raised
+        if (testFile.type === "prompt") {
+            await expect(
+                client.prompts.call({
+                    path: testFile.path,
+                    versionId: testFile.versionId,
+                    messages: testMessage,
+                }),
+            ).rejects.toThrow(
+                /Cannot use local file.*version_id or environment was specified/,
+            );
+        } else if (testFile.type === "agent") {
+            await expect(
+                client.agents.call({
+                    path: testFile.path,
+                    versionId: testFile.versionId,
+                    messages: testMessage,
+                }),
+            ).rejects.toThrow(
+                /Cannot use local file.*version_id or environment was specified/,
+            );
+        }
+
+        // WHEN calling with environment
+        // THEN a HumanloopRuntimeError should be raised
+        if (testFile.type === "prompt") {
+            await expect(
+                client.prompts.call({
+                    path: testFile.path,
+                    environment: "production",
+                    messages: testMessage,
+                }),
+            ).rejects.toThrow(
+                /Cannot use local file.*version_id or environment was specified/,
+            );
+        } else if (testFile.type === "agent") {
+            await expect(
+                client.agents.call({
+                    path: testFile.path,
+                    environment: "production",
+                    messages: testMessage,
+                }),
+            ).rejects.toThrow(
+                /Cannot use local file.*version_id or environment was specified/,
+            );
+        }
+
+        // WHEN calling with both version_id and environment
+        // THEN a HumanloopRuntimeError should be raised
+        if (testFile.type === "prompt") {
+            await expect(
+                client.prompts.call({
+                    path: testFile.path,
+                    versionId: testFile.versionId,
+                    environment: "staging",
+                    messages: testMessage,
+                }),
+            ).rejects.toThrow(
+                /Cannot use local file.*version_id or environment was specified/,
+            );
+        } else if (testFile.type === "agent") {
+            await expect(
+                client.agents.call({
+                    path: testFile.path,
+                    versionId: testFile.versionId,
+                    environment: "staging",
+                    messages: testMessage,
+                }),
+            ).rejects.toThrow(
+                /Cannot use local file.*version_id or environment was specified/,
+            );
+        }
+    });
+});
diff --git a/tests/custom/unit/LRUCache.test.ts b/tests/custom/unit/LRUCache.test.ts
new file mode 100644
index 00000000..f377165c
--- /dev/null
+++ b/tests/custom/unit/LRUCache.test.ts
@@ -0,0 +1,61 @@
+import LRUCache from "../../../src/cache/LRUCache";
+
+describe("LRUCache", () => {
+    let cache: LRUCache<string, number>;
+
+    beforeEach(() => {
+        cache = new LRUCache<string, number>(3); // Test with small capacity
+    });
+
+    describe("basic operations", () => {
+        it("should set and get values", () => {
+            cache.set("key1", 1);
+            expect(cache.get("key1")).toBe(1);
+        });
+
+        it("should return undefined for non-existent keys", () => {
+            expect(cache.get("nonexistent")).toBeUndefined();
+        });
+
+        it("should handle setting same key multiple times", () => {
+            cache.set("key1", 1);
+            cache.set("key1", 2);
+            expect(cache.get("key1")).toBe(2);
+        });
+    });
+
+    describe("capacity and eviction", () => {
+        it("should evict least recently used item when capacity is reached", () => {
+            cache.set("key1", 1);
+            cache.set("key2", 2);
+            cache.set("key3", 3);
+            cache.set("key4", 4); // Should evict key1
+
+            expect(cache.get("key1")).toBeUndefined();
+            expect(cache.get("key4")).toBe(4);
+        });
+
+        it("should update LRU order on get operations", () => {
+            cache.set("key1", 1);
+            cache.set("key2", 2);
+            cache.set("key3", 3);
+
+            cache.get("key1"); // Make key1 most recently used
+            cache.set("key4", 4); // Should evict key2, not key1
+
+            expect(cache.get("key1")).toBe(1);
+            expect(cache.get("key2")).toBeUndefined();
+        });
+    });
+
+    describe("clear operation", () => {
+        it("should clear all items from cache", () => {
+            cache.set("key1", 1);
+            cache.set("key2", 2);
+            cache.clear();
+
+            expect(cache.get("key1")).toBeUndefined();
+            expect(cache.get("key2")).toBeUndefined();
+        });
+    });
+});
diff --git a/tests/custom/unit/pathUtils.test.ts b/tests/custom/unit/pathUtils.test.ts
new file mode 100644
index 00000000..db71121e
--- /dev/null
+++ b/tests/custom/unit/pathUtils.test.ts
@@ -0,0 +1,78 @@
+import { normalizePath } from "../../../src/pathUtils";
+
+describe("normalizePath", () => {
+    const testCases = [
+        // Basic cases
+        {
+            input: "path/to/file.prompt",
+            expectedWithExtension: "path/to/file.prompt",
+            expectedWithoutExtension: "path/to/file",
+        },
+        {
+            input: "path\\to\\file.agent",
+            expectedWithExtension: "path/to/file.agent",
+            expectedWithoutExtension: "path/to/file",
+        },
+        {
+            input: "/leading/slashes/file.prompt",
+            expectedWithExtension: "leading/slashes/file.prompt",
+            expectedWithoutExtension: "leading/slashes/file",
+        },
+        {
+            input: "trailing/slashes/file.agent/",
+            expectedWithExtension: "trailing/slashes/file.agent",
+            expectedWithoutExtension: "trailing/slashes/file",
+        },
+        {
+            input: "multiple//slashes//file.prompt",
+            expectedWithExtension: "multiple/slashes/file.prompt",
+            expectedWithoutExtension: "multiple/slashes/file",
+        },
+        // Edge cases
+        {
+            input: "path/to/file with spaces.prompt",
+            expectedWithExtension: "path/to/file with spaces.prompt",
+            expectedWithoutExtension: "path/to/file with spaces",
+        },
+        {
+            input: "path/to/file\\with\\backslashes.prompt",
+            expectedWithExtension: "path/to/file/with/backslashes.prompt",
+            expectedWithoutExtension: "path/to/file/with/backslashes",
+        },
+        {
+            input: "path/to/unicode/文件.prompt",
+            expectedWithExtension: "path/to/unicode/文件.prompt",
+            expectedWithoutExtension: "path/to/unicode/文件",
+        },
+        {
+            input: "path/to/special/chars/!@#$%^&*().prompt",
+            expectedWithExtension: "path/to/special/chars/!@#$%^&*().prompt",
+            expectedWithoutExtension: "path/to/special/chars/!@#$%^&*()",
+        },
+    ];
+
+    test.each(testCases)(
+        "normalizes path '$input' correctly",
+        ({ input, expectedWithExtension, expectedWithoutExtension }) => {
+            // Test without stripping extension
+            const resultWithExtension = normalizePath(input, false);
+            expect(resultWithExtension).toBe(expectedWithExtension);
+
+            // Test with extension stripping
+            const resultWithoutExtension = normalizePath(input, true);
+            expect(resultWithoutExtension).toBe(expectedWithoutExtension);
+
+            // Add custom failure messages if needed
+            if (resultWithExtension !== expectedWithExtension) {
+                throw new Error(
+                    `Failed with stripExtension=false for '${input}'. Expected '${expectedWithExtension}', got '${resultWithExtension}'`,
+                );
+            }
+            if (resultWithoutExtension !== expectedWithoutExtension) {
+                throw new Error(
+                    `Failed with stripExtension=true for '${input}'. Expected '${expectedWithoutExtension}', got '${resultWithoutExtension}'`,
+                );
+            }
+        },
+    );
+});