diff --git a/tests/asset_cache.js b/tests/asset_cache.js
index 8d4cb61fc..9d1182014 100644
--- a/tests/asset_cache.js
+++ b/tests/asset_cache.js
@@ -23,10 +23,11 @@ const TEST_IMAGES = Object.freeze({
   beetle: BASE_URL + "beetle.png",
   book_cover: BASE_URL + "book-cover.png",
   corgi: BASE_URL + "corgi.jpg",
+  man_on_car: BASE_URL + "young-man-standing-and-leaning-on-car.jpg",
 });
 
 const TEST_AUDIOS = {
-  mlk: "https://huggingface.co/datasets/Xenova/transformers.js-docs/resolve/main/mlk.npy",
+  mlk: BASE_URL + "mlk.npy",
 };
 
 /** @type {Map<string, RawImage>} */
diff --git a/tests/pipelines/test_pipelines_image_segmentation.js b/tests/pipelines/test_pipelines_image_segmentation.js
new file mode 100644
index 000000000..01d17170b
--- /dev/null
+++ b/tests/pipelines/test_pipelines_image_segmentation.js
@@ -0,0 +1,115 @@
+import { pipeline, ImageSegmentationPipeline } from "../../src/transformers.js";
+
+import { MAX_MODEL_LOAD_TIME, MAX_TEST_EXECUTION_TIME, MAX_MODEL_DISPOSE_TIME, DEFAULT_MODEL_OPTIONS } from "../init.js";
+import { load_cached_image } from "../asset_cache.js";
+
+const PIPELINE_ID = "image-segmentation";
+
+export default () => {
+  describe("Image Segmentation", () => {
+    describe("Panoptic Segmentation", () => {
+      const model_id = "Xenova/detr-resnet-50-panoptic";
+      /** @type {ImageSegmentationPipeline } */
+      let pipe;
+      beforeAll(async () => {
+        pipe = await pipeline(PIPELINE_ID, model_id, DEFAULT_MODEL_OPTIONS);
+      }, MAX_MODEL_LOAD_TIME);
+
+      it(
+        "single",
+        async () => {
+          const image = await load_cached_image("cats");
+
+          const output = await pipe(image);
+
+          // First, check mask shapes
+          for (const item of output) {
+            expect(item.mask.width).toEqual(image.width);
+            expect(item.mask.height).toEqual(image.height);
+            expect(item.mask.channels).toEqual(1);
+            delete item.mask; // No longer needed
+          }
+
+          // Next, compare scores and labels
+          const target = [
+            {
+              score: 0.9918501377105713,
+              label: "cat",
+            },
+            {
+              score: 0.9985815286636353,
+              label: "remote",
+            },
+            {
+              score: 0.999537467956543,
+              label: "remote",
+            },
+            {
+              score: 0.9919270277023315,
+              label: "couch",
+            },
+            {
+              score: 0.9993696808815002,
+              label: "cat",
+            },
+          ];
+
+          expect(output).toBeCloseToNested(target, 2);
+        },
+        MAX_TEST_EXECUTION_TIME,
+      );
+
+      afterAll(async () => {
+        await pipe.dispose();
+      }, MAX_MODEL_DISPOSE_TIME);
+    });
+
+    describe("Semantic Segmentation", () => {
+      const model_id = "Xenova/segformer_b0_clothes";
+      /** @type {ImageSegmentationPipeline } */
+      let pipe;
+      beforeAll(async () => {
+        pipe = await pipeline(PIPELINE_ID, model_id, DEFAULT_MODEL_OPTIONS);
+      }, MAX_MODEL_LOAD_TIME);
+
+      it(
+        "single",
+        async () => {
+          const image = await load_cached_image("man_on_car");
+
+          const output = await pipe(image);
+
+          // First, check mask shapes
+          for (const item of output) {
+            expect(item.mask.width).toEqual(image.width);
+            expect(item.mask.height).toEqual(image.height);
+            expect(item.mask.channels).toEqual(1);
+            delete item.mask; // No longer needed
+          }
+
+          // Next, compare scores and labels
+          const target = [
+            { score: null, label: "Background" },
+            { score: null, label: "Hair" },
+            { score: null, label: "Upper-clothes" },
+            { score: null, label: "Pants" },
+            { score: null, label: "Left-shoe" },
+            { score: null, label: "Right-shoe" },
+            { score: null, label: "Face" },
+            { score: null, label: "Right-leg" },
+            { score: null, label: "Left-arm" },
+            { score: null, label: "Right-arm" },
+            { score: null, label: "Bag" },
+          ];
+
+          expect(output).toBeCloseToNested(target, 2);
+        },
+        MAX_TEST_EXECUTION_TIME,
+      );
+
+      afterAll(async () => {
+        await pipe.dispose();
+      }, MAX_MODEL_DISPOSE_TIME);
+    });
+  });
+};