diff --git a/Cargo.lock b/Cargo.lock
index 611ef2dd..58105093 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -31,6 +31,24 @@ dependencies = [
  "memchr",
 ]
 
+[[package]]
+name = "aligned"
+version = "0.4.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ee4508988c62edf04abd8d92897fca0c2995d907ce1dfeaf369dac3716a40685"
+dependencies = [
+ "as-slice",
+]
+
+[[package]]
+name = "aligned-vec"
+version = "0.6.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "dc890384c8602f339876ded803c97ad529f3842aba97f6392b3dba0dd171769b"
+dependencies = [
+ "equator",
+]
+
 [[package]]
 name = "android_system_properties"
 version = "0.1.5"
@@ -105,6 +123,12 @@ dependencies = [
  "num-traits",
 ]
 
+[[package]]
+name = "arbitrary"
+version = "1.4.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c3d036a3c4ab069c7b410a2ce876bd74808d2d0888a82667669f8e783a898bf1"
+
 [[package]]
 name = "arc-swap"
 version = "1.9.1"
@@ -114,6 +138,32 @@ dependencies = [
  "rustversion",
 ]
 
+[[package]]
+name = "arg_enum_proc_macro"
+version = "0.3.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0ae92a5119aa49cdbcf6b9f893fe4e1d98b04ccbf82ee0584ad948a44a734dea"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn",
+]
+
+[[package]]
+name = "arrayvec"
+version = "0.7.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7c02d123df017efcdfbd739ef81735b36c5ba83ec3c59c80a9d7ecc718f92e50"
+
+[[package]]
+name = "as-slice"
+version = "0.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "516b6b4f0e40d50dcda9365d53964ec74560ad4284da2e7fc97122cd83174516"
+dependencies = [
+ "stable_deref_trait",
+]
+
 [[package]]
 name = "async-trait"
 version = "0.1.89"
@@ -146,6 +196,49 @@ version = "1.5.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "c08606f8c3cbf4ce6ec8e28fb0014a2c086708fe954eaa885384a6165172e7e8"
 
+[[package]]
+name = "av-scenechange"
+version = "0.14.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0f321d77c20e19b92c39e7471cf986812cbb46659d2af674adc4331ef3f18394"
+dependencies = [
+ "aligned",
+ "anyhow",
+ "arg_enum_proc_macro",
+ "arrayvec",
+ "log",
+ "num-rational",
+ "num-traits",
+ "pastey",
+ "rayon",
+ "thiserror 2.0.18",
+ "v_frame",
+ "y4m",
+]
+
+[[package]]
+name = "av1-grain"
+version = "0.2.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8cfddb07216410377231960af4fcab838eaa12e013417781b78bd95ee22077f8"
+dependencies = [
+ "anyhow",
+ "arrayvec",
+ "log",
+ "nom 8.0.0",
+ "num-rational",
+ "v_frame",
+]
+
+[[package]]
+name = "avif-serialize"
+version = "0.8.8"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "375082f007bd67184fb9c0374614b29f9aaa604ec301635f72338bb65386a53d"
+dependencies = [
+ "arrayvec",
+]
+
 [[package]]
 name = "aws-lc-rs"
 version = "1.16.2"
@@ -187,6 +280,7 @@ dependencies = [
  "matchit",
  "memchr",
  "mime",
+ "multer",
  "percent-encoding",
  "pin-project-lite",
  "serde_core",
@@ -260,12 +354,27 @@ version = "1.8.3"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "2af50177e190e07a26ab74f8b1efbfe2ef87da2116221318cb1c2e82baf7de06"
 
+[[package]]
+name = "bit_field"
+version = "0.10.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1e4b40c7323adcfc0a41c4b88143ed58346ff65a288fc144329c5c45e05d70c6"
+
 [[package]]
 name = "bitflags"
 version = "2.11.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "843867be96c8daad0d758b57df9392b6d8d271134fce549de6ce169ff98a92af"
 
+[[package]]
+name = "bitstream-io"
+version = "4.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7eff00be299a18769011411c9def0d827e8f2d7bf0c3dbf53633147a8867fd1f"
+dependencies = [
+ "no_std_io2",
+]
+
 [[package]]
 name = "block-buffer"
 version = "0.10.4"
@@ -285,6 +394,12 @@ dependencies = [
  "serde",
 ]
 
+[[package]]
+name = "built"
+version = "0.8.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f4ad8f11f288f48ca24471bbd51ac257aaeaaa07adae295591266b792902ae64"
+
 [[package]]
 name = "bumpalo"
 version = "3.20.2"
@@ -303,11 +418,20 @@ version = "1.5.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "1fd0f2584146f6f2ef48085050886acf353beff7305ebd1ae69500e27c67f64b"
 
+[[package]]
+name = "byteorder-lite"
+version = "0.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8f1fe948ff07f4bd06c30984e69f5b4899c516a3ef74f34df92a2df2ab535495"
+
 [[package]]
 name = "bytes"
 version = "1.11.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "1e748733b7cbc798e1434b6ac524f0c1ff2ab456fe201501e6497c8417a4fc33"
+dependencies = [
+ "serde",
+]
 
 [[package]]
 name = "castaway"
@@ -471,6 +595,12 @@ dependencies = [
  "regex-lite",
 ]
 
+[[package]]
+name = "color_quant"
+version = "1.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3d7b894f5411737b7867f4827955924d7c254fc9f4d91a6aad6b097804b1018b"
+
 [[package]]
 name = "colorchoice"
 version = "1.0.5"
@@ -599,6 +729,12 @@ version = "0.8.21"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "d0a5c400df2834b80a4c3327b3aad3a4c4cd4de0629063962b03235697506a28"
 
+[[package]]
+name = "crunchy"
+version = "0.2.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "460fbee9c2c2f33933d720630a6a0bac33ba7053db5344fac858d4b8952d77d5"
+
 [[package]]
 name = "crypto-common"
 version = "0.1.7"
@@ -819,6 +955,7 @@ dependencies = [
  "anyhow",
  "axum",
  "axum-server",
+ "bytes",
  "clap",
  "clap_derive",
  "codspeed-divan-compat",
@@ -827,6 +964,8 @@ dependencies = [
  "dotenv",
  "figment",
  "flate2",
+ "image",
+ "image-ndarray",
  "mlua",
  "ndarray",
  "ndarray-stats",
@@ -918,6 +1057,26 @@ dependencies = [
  "log",
 ]
 
+[[package]]
+name = "equator"
+version = "0.4.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4711b213838dfee0117e3be6ac926007d7f433d7bbe33595975d4190cb07e6fc"
+dependencies = [
+ "equator-macro",
+]
+
+[[package]]
+name = "equator-macro"
+version = "0.4.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "44f23cf4b44bfce11a86ace86f8a73ffdec849c9fd00a386a53d278bd9e81fb3"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn",
+]
+
 [[package]]
 name = "equivalent"
 version = "1.0.2"
@@ -943,12 +1102,42 @@ dependencies = [
  "cc",
 ]
 
+[[package]]
+name = "exr"
+version = "1.74.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4300e043a56aa2cb633c01af81ca8f699a321879a7854d3896a0ba89056363be"
+dependencies = [
+ "bit_field",
+ "half",
+ "lebe",
+ "miniz_oxide",
+ "rayon-core",
+ "smallvec 1.15.1",
+ "zune-inflate",
+]
+
 [[package]]
 name = "fastrand"
 version = "2.4.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "9f1f227452a390804cdb637b74a86990f2a7d7ba4b7d5693aac9b4dd6defd8d6"
 
+[[package]]
+name = "fax"
+version = "0.2.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "caf1079563223d5d59d83c85886a56e586cfd5c1a26292e971a0fa266531ac5a"
+
+[[package]]
+name = "fdeflate"
+version = "0.3.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1e6853b52649d4ac5c0bd02320cddc5ba956bdb407c4b75a2c6b75bf51500f8c"
+dependencies = [
+ "simd-adler32",
+]
+
 [[package]]
 name = "figment"
 version = "0.10.19"
@@ -1186,6 +1375,16 @@ dependencies = [
  "wasip3",
 ]
 
+[[package]]
+name = "gif"
+version = "0.14.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ee8cfcc411d9adbbaba82fb72661cc1bcca13e8bba98b364e62b2dba8f960159"
+dependencies = [
+ "color_quant",
+ "weezl",
+]
+
 [[package]]
 name = "glob"
 version = "0.3.3"
@@ -1211,6 +1410,17 @@ dependencies = [
  "tracing",
 ]
 
+[[package]]
+name = "half"
+version = "2.7.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6ea2d84b969582b4b1864a92dc5d27cd2b77b622a8d79306834f1be5ba20d84b"
+dependencies = [
+ "cfg-if",
+ "crunchy",
+ "zerocopy",
+]
+
 [[package]]
 name = "hashbrown"
 version = "0.15.5"
@@ -1492,6 +1702,59 @@ dependencies = [
  "icu_properties",
 ]
 
+[[package]]
+name = "image"
+version = "0.25.10"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "85ab80394333c02fe689eaf900ab500fbd0c2213da414687ebf995a65d5a6104"
+dependencies = [
+ "bytemuck",
+ "byteorder-lite",
+ "color_quant",
+ "exr",
+ "gif",
+ "image-webp",
+ "moxcms",
+ "num-traits",
+ "png",
+ "qoi",
+ "ravif",
+ "rayon",
+ "rgb",
+ "serde",
+ "tiff",
+ "zune-core",
+ "zune-jpeg",
+]
+
+[[package]]
+name = "image-ndarray"
+version = "0.1.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "366ec4e7613badea5930852b9fc8781fdbb010a59845a3a5c1cf61d0ccc3f133"
+dependencies = [
+ "image",
+ "ndarray",
+ "num-traits",
+ "thiserror 2.0.18",
+]
+
+[[package]]
+name = "image-webp"
+version = "0.2.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "525e9ff3e1a4be2fbea1fdf0e98686a6d98b4d8f937e1bf7402245af1909e8c3"
+dependencies = [
+ "byteorder-lite",
+ "quick-error",
+]
+
+[[package]]
+name = "imgref"
+version = "1.12.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "40fac9d56ed6437b198fddba683305e8e2d651aa42647f00f5ae542e7f5c94a2"
+
 [[package]]
 name = "indexmap"
 version = "2.14.0"
@@ -1532,6 +1795,17 @@ version = "0.1.15"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "c8fae54786f62fb2918dcfae3d568594e50eb9b5c25bf04371af6fe7516452fb"
 
+[[package]]
+name = "interpolate_name"
+version = "0.2.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c34819042dc3d3971c46c2190835914dfbe0c3c13f61449b2997f4e9722dfa60"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn",
+]
+
 [[package]]
 name = "ipnet"
 version = "2.12.0"
@@ -1656,12 +1930,28 @@ version = "0.1.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "09edd9e8b54e49e587e4f6295a7d29c3ea94d469cb40ab8ca70b288248a81db2"
 
+[[package]]
+name = "lebe"
+version = "0.5.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7a79a3332a6609480d7d0c9eab957bca6b455b91bb84e66d19f5ff66294b85b8"
+
 [[package]]
 name = "libc"
 version = "0.2.185"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "52ff2c0fe9bc6cb6b14a0592c2ff4fa9ceb83eea9db979b0487cd054946a2b8f"
 
+[[package]]
+name = "libfuzzer-sys"
+version = "0.4.12"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f12a681b7dd8ce12bff52488013ba614b869148d54dd79836ab85aafdd53f08d"
+dependencies = [
+ "arbitrary",
+ "cc",
+]
+
 [[package]]
 name = "libredox"
 version = "0.1.16"
@@ -1701,6 +1991,15 @@ version = "0.4.29"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "5e5032e24019045c762d3c0f28f5b6b8bbf38563a65908389bf7978758920897"
 
+[[package]]
+name = "loop9"
+version = "0.1.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0fae87c125b03c1d2c0150c90365d7d6bcc53fb73a9acaef207d2d065860f062"
+dependencies = [
+ "imgref",
+]
+
 [[package]]
 name = "lru-slab"
 version = "0.1.2"
@@ -1767,6 +2066,16 @@ dependencies = [
  "rawpointer",
 ]
 
+[[package]]
+name = "maybe-rayon"
+version = "0.1.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8ea1f30cedd69f0a2954655f7188c6a834246d2bcf1e315e2ac40c4b24dc9519"
+dependencies = [
+ "cfg-if",
+ "rayon",
+]
+
 [[package]]
 name = "memchr"
 version = "2.8.0"
@@ -1867,6 +2176,33 @@ dependencies = [
  "syn",
 ]
 
+[[package]]
+name = "moxcms"
+version = "0.8.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bb85c154ba489f01b25c0d36ae69a87e4a1c73a72631fc6c0eb6dde34a73e44b"
+dependencies = [
+ "num-traits",
+ "pxfm",
+]
+
+[[package]]
+name = "multer"
+version = "3.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "83e87776546dc87511aa5ee218730c92b666d7264ab6ed41f9d215af9cd5224b"
+dependencies = [
+ "bytes",
+ "encoding_rs",
+ "futures-util",
+ "http",
+ "httparse",
+ "memchr",
+ "mime",
+ "spin",
+ "version_check",
+]
+
 [[package]]
 name = "multimap"
 version = "0.10.1"
@@ -1920,6 +2256,12 @@ dependencies = [
  "rand 0.8.5",
 ]
 
+[[package]]
+name = "new_debug_unreachable"
+version = "1.0.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "650eef8c711430f1a879fdd01d4745a7deea475becfb90269c06775983bbf086"
+
 [[package]]
 name = "nix"
 version = "0.31.2"
@@ -1932,6 +2274,15 @@ dependencies = [
  "libc",
 ]
 
+[[package]]
+name = "no_std_io2"
+version = "0.9.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b51ed7824b6e07d354605f4abb3d9d300350701299da96642ee084f5ce631550"
+dependencies = [
+ "memchr",
+]
+
 [[package]]
 name = "noisy_float"
 version = "0.2.1"
@@ -1951,6 +2302,21 @@ dependencies = [
  "minimal-lexical",
 ]
 
+[[package]]
+name = "nom"
+version = "8.0.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "df9761775871bdef83bee530e60050f7e54b1105350d6884eb0fb4f46c2f9405"
+dependencies = [
+ "memchr",
+]
+
+[[package]]
+name = "noop_proc_macro"
+version = "0.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0676bb32a98c1a483ce53e500a81ad9c3d5b3f7c920c28c24e9cb0980d0b5bc8"
+
 [[package]]
 name = "nu-ansi-term"
 version = "0.50.3"
@@ -1960,6 +2326,16 @@ dependencies = [
  "windows-sys 0.61.2",
 ]
 
+[[package]]
+name = "num-bigint"
+version = "0.4.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a5e44f723f1133c9deac646763579fdb3ac745e418f2a7af9cd0c431da1f20b9"
+dependencies = [
+ "num-integer",
+ "num-traits",
+]
+
 [[package]]
 name = "num-complex"
 version = "0.4.6"
@@ -1969,6 +2345,17 @@ dependencies = [
  "num-traits",
 ]
 
+[[package]]
+name = "num-derive"
+version = "0.4.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ed3955f1a9c7c0c15e092f9c887db08b1fc683305fdf6eb6684f22555355e202"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn",
+]
+
 [[package]]
 name = "num-integer"
 version = "0.1.46"
@@ -1978,6 +2365,17 @@ dependencies = [
  "num-traits",
 ]
 
+[[package]]
+name = "num-rational"
+version = "0.4.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f83d14da390562dca69fc84082e73e548e1ad308d24accdedd2720017cb37824"
+dependencies = [
+ "num-bigint",
+ "num-integer",
+ "num-traits",
+]
+
 [[package]]
 name = "num-traits"
 version = "0.2.19"
@@ -2216,6 +2614,12 @@ version = "1.0.15"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "57c0d7b74b563b49d38dae00a0c37d4d6de9b432382b2892f0574ddcae73fd0a"
 
+[[package]]
+name = "pastey"
+version = "0.1.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "35fb2e5f958ec131621fdd531e9fc186ed768cbe395337403ae56c17a74c68ec"
+
 [[package]]
 name = "pear"
 version = "0.2.9"
@@ -2303,6 +2707,19 @@ version = "0.2.3"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "b4596b6d070b27117e987119b4dac604f3c58cfb0b191112e24771b2faeac1a6"
 
+[[package]]
+name = "png"
+version = "0.18.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "60769b8b31b2a9f263dae2776c37b1b28ae246943cf719eb6946a1db05128a61"
+dependencies = [
+ "bitflags",
+ "crc32fast",
+ "fdeflate",
+ "flate2",
+ "miniz_oxide",
+]
+
 [[package]]
 name = "portable-atomic"
 version = "1.13.1"
@@ -2377,6 +2794,25 @@ dependencies = [
  "yansi",
 ]
 
+[[package]]
+name = "profiling"
+version = "1.0.17"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3eb8486b569e12e2c32ad3e204dbaba5e4b5b216e9367044f25f1dba42341773"
+dependencies = [
+ "profiling-procmacros",
+]
+
+[[package]]
+name = "profiling-procmacros"
+version = "1.0.17"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "52717f9a02b6965224f95ca2a81e2e0c5c43baacd28ca057577988930b6c3d5b"
+dependencies = [
+ "quote",
+ "syn",
+]
+
 [[package]]
 name = "prost"
 version = "0.14.3"
@@ -2450,6 +2886,12 @@ dependencies = [
  "pulldown-cmark",
 ]
 
+[[package]]
+name = "pxfm"
+version = "0.1.29"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e0c5ccf5294c6ccd63a74f1565028353830a9c2f5eb0c682c355c471726a6e3f"
+
 [[package]]
 name = "pyo3"
 version = "0.27.2"
@@ -2511,6 +2953,21 @@ dependencies = [
  "syn",
 ]
 
+[[package]]
+name = "qoi"
+version = "0.4.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7f6d64c71eb498fe9eae14ce4ec935c555749aef511cca85b5568910d6e48001"
+dependencies = [
+ "bytemuck",
+]
+
+[[package]]
+name = "quick-error"
+version = "2.0.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a993555f31e5a609f617c12db6250dedcac1b0a85076912c436e6fc9b2c8e6a3"
+
 [[package]]
 name = "quinn"
 version = "0.11.9"
@@ -2647,6 +3104,56 @@ dependencies = [
  "getrandom 0.3.4",
 ]
 
+[[package]]
+name = "rav1e"
+version = "0.8.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "43b6dd56e85d9483277cde964fd1bdb0428de4fec5ebba7540995639a21cb32b"
+dependencies = [
+ "aligned-vec",
+ "arbitrary",
+ "arg_enum_proc_macro",
+ "arrayvec",
+ "av-scenechange",
+ "av1-grain",
+ "bitstream-io",
+ "built",
+ "cfg-if",
+ "interpolate_name",
+ "itertools 0.14.0",
+ "libc",
+ "libfuzzer-sys",
+ "log",
+ "maybe-rayon",
+ "new_debug_unreachable",
+ "noop_proc_macro",
+ "num-derive",
+ "num-traits",
+ "paste",
+ "profiling",
+ "rand 0.9.3",
+ "rand_chacha 0.9.0",
+ "simd_helpers",
+ "thiserror 2.0.18",
+ "v_frame",
+ "wasm-bindgen",
+]
+
+[[package]]
+name = "ravif"
+version = "0.13.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e52310197d971b0f5be7fe6b57530dcd27beb35c1b013f29d66c1ad73fbbcc45"
+dependencies = [
+ "avif-serialize",
+ "imgref",
+ "loop9",
+ "quick-error",
+ "rav1e",
+ "rayon",
+ "rgb",
+]
+
 [[package]]
 name = "rawpointer"
 version = "0.2.1"
@@ -2852,6 +3359,12 @@ dependencies = [
  "web-sys",
 ]
 
+[[package]]
+name = "rgb"
+version = "0.8.53"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "47b34b781b31e5d73e9fbc8689c70551fd1ade9a19e3e28cfec8580a79290cc4"
+
 [[package]]
 name = "ring"
 version = "0.17.14"
@@ -3237,6 +3750,15 @@ version = "0.3.9"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "703d5c7ef118737c72f1af64ad2f6f8c5e1921f818cdcb97b8fe6fc69bf66214"
 
+[[package]]
+name = "simd_helpers"
+version = "0.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "95890f873bec569a0362c235787f3aca6e1e887302ba4840839bcc6459c42da6"
+dependencies = [
+ "quote",
+]
+
 [[package]]
 name = "slab"
 version = "0.4.12"
@@ -3276,6 +3798,12 @@ dependencies = [
  "winapi",
 ]
 
+[[package]]
+name = "spin"
+version = "0.9.8"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6980e8d7511241f8acf4aebddbb1ff938df5eebe98691418c4468d0b72a96a67"
+
 [[package]]
 name = "spm_precompiled"
 version = "0.1.4"
@@ -3283,7 +3811,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "5851699c4033c63636f7ea4cf7b7c1f1bf06d0cc03cfb42e711de5a5c46cf326"
 dependencies = [
  "base64 0.13.1",
- "nom",
+ "nom 7.1.3",
  "serde",
  "unicode-segmentation",
 ]
@@ -3498,6 +4026,20 @@ dependencies = [
  "cfg-if",
 ]
 
+[[package]]
+name = "tiff"
+version = "0.11.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b63feaf3343d35b6ca4d50483f94843803b0f51634937cc2ec519fc32232bc52"
+dependencies = [
+ "fax",
+ "flate2",
+ "half",
+ "quick-error",
+ "weezl",
+ "zune-jpeg",
+]
+
 [[package]]
 name = "tinystr"
 version = "0.8.3"
@@ -4071,6 +4613,17 @@ dependencies = [
  "wasm-bindgen",
 ]
 
+[[package]]
+name = "v_frame"
+version = "0.3.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "666b7727c8875d6ab5db9533418d7c764233ac9c0cff1d469aec8fa127597be2"
+dependencies = [
+ "aligned-vec",
+ "num-traits",
+ "wasm-bindgen",
+]
+
 [[package]]
 name = "valuable"
 version = "0.1.1"
@@ -4272,6 +4825,12 @@ dependencies = [
  "rustls-pki-types",
 ]
 
+[[package]]
+name = "weezl"
+version = "0.1.12"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a28ac98ddc8b9274cb41bb4d9d4d5c425b6020c50c46f25559911905610b4a88"
+
 [[package]]
 name = "which"
 version = "8.0.2"
@@ -4726,6 +5285,12 @@ dependencies = [
  "rustix",
 ]
 
+[[package]]
+name = "y4m"
+version = "0.8.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7a5a4b21e1a62b67a2970e6831bc091d7b87e119e7f9791aef9702e3bef04448"
+
 [[package]]
 name = "yansi"
 version = "1.0.1"
@@ -4840,3 +5405,27 @@ name = "zmij"
 version = "1.0.21"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "b8848ee67ecc8aedbaf3e4122217aff892639231befc6a1b58d29fff4c2cabaa"
+
+[[package]]
+name = "zune-core"
+version = "0.5.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cb8a0807f7c01457d0379ba880ba6322660448ddebc890ce29bb64da71fb40f9"
+
+[[package]]
+name = "zune-inflate"
+version = "0.2.54"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "73ab332fe2f6680068f3582b16a24f90ad7096d5d39b974d1c0aff0125116f02"
+dependencies = [
+ "simd-adler32",
+]
+
+[[package]]
+name = "zune-jpeg"
+version = "0.5.15"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "27bc9d5b815bc103f142aa054f561d9187d191692ec7c2d1e2b4737f8dbd7296"
+dependencies = [
+ "zune-core",
+]
diff --git a/Cargo.toml b/Cargo.toml
index 7f7b8059..ecea85cd 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -14,6 +14,15 @@ ndarray = "0.16.1"
 serde = { version = "1.0.228", features = ["serde_derive"] }
 tracing = "0.1.41"
 thiserror = "2.0.17"
+image-ndarray = "0.1.5"
+
+[workspace.dependencies.bytes]
+version = "1.11.1"
+features = ["serde"]
+
+[workspace.dependencies.image]
+version = "0.25.10"
+features = ["serde"]
 
 [workspace.dependencies.parking_lot]
 version = "0.12.5"
diff --git a/encoderfile-runtime/src/main.rs b/encoderfile-runtime/src/main.rs
index 003d7d42..07dbe0f7 100644
--- a/encoderfile-runtime/src/main.rs
+++ b/encoderfile-runtime/src/main.rs
@@ -1,19 +1,16 @@
 use parking_lot::Mutex;
 use std::{
-    fs::File,
-    io::{BufReader, Read, Seek},
-    sync::Arc,
+    error::Error, fs::File, io::{BufReader, Read, Seek, Error as IOError, ErrorKind}, sync::Arc,
 };
 
 use anyhow::Result;
 use clap::Parser;
 use encoderfile::{
-    common::{
-        ModelType,
-        model_type::{Embedding, SentenceEmbedding, SequenceClassification, TokenClassification},
-    },
-    runtime::{EncoderfileLoader, EncoderfileState, load_assets},
-    transport::cli::Cli,
+    common::{ModelConfig, model_type::{
+        Embedding, ImageClassification, ModelType, SentenceEmbedding, SequenceClassification, TokenClassification
+    }},
+    runtime::{ClassifierState, EncoderfileLoader, EncoderfileState, FeatureExtractorState, ImageInputState, TextInputState, load_assets},
+    transport::cli::{TextCli, ImageCli},
 };
 
 #[tokio::main]
@@ -30,49 +27,78 @@ async fn main() -> Result<()> {
 }
 
 macro_rules! run_cli {
-    ($model_type:ident, $cli:expr, $config:expr, $session:expr, $tokenizer:expr, $model_config:expr) => {{
+    ($model_type:ident, $cli:expr, $config:expr, $session:expr, $input_state:expr, $task_state:expr) => {{
         let state = Arc::new(EncoderfileState::<$model_type>::new(
             $config,
             $session,
-            $tokenizer,
-            $model_config,
+            $input_state,
+            $task_state,
         ));
         $cli.command.execute(state).await
     }};
 }
 
 async fn entrypoint<'a, R: Read + Seek>(loader: &mut EncoderfileLoader<'a, R>) -> Result<()> {
-    let cli = Cli::parse();
     let session = Mutex::new(loader.session()?);
     let model_config = loader.model_config()?;
-    let tokenizer = loader.tokenizer()?;
     let config = loader.encoderfile_config()?;
+    // TODO clear out lifetimes in state and loader to avoid
+
+    fn class_task_state(model_config: &ModelConfig) -> ClassifierState {
+        // if num_labels, make a vector of labels
+        // if id2label, make sure it's 0..n-1
+        ClassifierState {
+            id2label: model_config.id2label.clone(),
+            label2id: model_config.label2id.clone(),
+            num_labels: model_config.num_labels,
+        }
+    }
 
     match loader.model_type() {
-        ModelType::Embedding => run_cli!(Embedding, cli, config, session, tokenizer, model_config),
+        ModelType::Embedding => run_cli!(
+            Embedding,
+            TextCli::parse(),
+            config,
+            session,
+            TextInputState { tokenizer: loader.tokenizer()?, model_config },
+            FeatureExtractorState {}
+        ),
         ModelType::SequenceClassification => run_cli!(
             SequenceClassification,
-            cli,
+            TextCli::parse(),
             config,
             session,
-            tokenizer,
-            model_config
+            TextInputState { tokenizer: loader.tokenizer()?, model_config: model_config.clone() },
+            class_task_state(&model_config)
         ),
         ModelType::TokenClassification => run_cli!(
             TokenClassification,
-            cli,
+            TextCli::parse(),
             config,
             session,
-            tokenizer,
-            model_config
+            TextInputState { tokenizer: loader.tokenizer()?, model_config: model_config.clone() },
+            class_task_state(&model_config)
         ),
         ModelType::SentenceEmbedding => run_cli!(
             SentenceEmbedding,
-            cli,
+            TextCli::parse(),
+            config,
+            session,
+            TextInputState { tokenizer: loader.tokenizer()?, model_config },
+            FeatureExtractorState {}
+        ),
+        ModelType::ImageClassification => run_cli!(
+            ImageClassification,
+            ImageCli::parse(),
             config,
             session,
-            tokenizer,
-            model_config
+            ImageInputState { 
+                height: model_config.height(),
+                width: model_config.width(),
+                num_channels: model_config.num_channels().ok_or(IOError::new(ErrorKind::InvalidData, "Missing required configuration field"))?,
+                image_size: model_config.image_size,
+            },
+            class_task_state(&model_config)
         ),
     }
 }
diff --git a/encoderfile/Cargo.toml b/encoderfile/Cargo.toml
index 90c45150..2ea2eac3 100644
--- a/encoderfile/Cargo.toml
+++ b/encoderfile/Cargo.toml
@@ -139,9 +139,18 @@ workspace = true
 [dependencies.serde_json]
 workspace = true
 
+[dependencies.bytes]
+workspace = true
+
 [dependencies.ndarray]
 workspace = true
 
+[dependencies.image]
+workspace = true
+
+[dependencies.image-ndarray]
+workspace = true
+
 [dependencies.figment]
 version = "0.10.19"
 features = ["env", "serde_yaml", "yaml"]
@@ -211,6 +220,7 @@ optional = true
 
 [dependencies.axum]
 version = "0.8.6"
+features = ["multipart"]
 optional = true
 
 [dependencies.axum-server]
diff --git a/encoderfile/benches/postprocessing.rs b/encoderfile/benches/postprocessing.rs
index dbb66816..bcd1053e 100644
--- a/encoderfile/benches/postprocessing.rs
+++ b/encoderfile/benches/postprocessing.rs
@@ -16,7 +16,7 @@ fn main() {
 
 #[divan::bench(args = [(8, 16, 384), (16, 128, 768), (64, 512, 1024)])]
 fn embedding_postprocess(b: Bencher, dim: (usize, usize, usize)) {
-    let tokenizer = &embedding_state().tokenizer;
+    let tokenizer = &embedding_state().per_model_input_state.tokenizer;
     let (batch, tokens, hidden) = dim;
 
     // Random embeddings
@@ -35,7 +35,7 @@ fn embedding_postprocess(b: Bencher, dim: (usize, usize, usize)) {
 #[divan::bench(args = [8, 16, 64])]
 fn sequence_classification_postprocess(b: Bencher, batch: usize) {
     let state = sequence_classification_state();
-    let config = &state.model_config;
+    let config = &state.per_task_state;
     let n_labels = config.id2label.clone().unwrap().len();
 
     let mut rng = rand::rng();
@@ -51,10 +51,10 @@ fn sequence_classification_postprocess(b: Bencher, batch: usize) {
 #[divan::bench(args = [(8, 16), (16, 128), (64, 512)])]
 fn token_classification_postprocess(b: Bencher, dim: (usize, usize)) {
     let state = token_classification_state();
-    let config = &state.model_config;
+    let config = &state.per_task_state;
     let n_labels = config.id2label.clone().unwrap().len();
 
-    let tokenizer = &embedding_state().tokenizer;
+    let tokenizer = &embedding_state().per_model_input_state.tokenizer;
     let (batch, tokens) = dim;
 
     // Random embeddings
diff --git a/encoderfile/build.rs b/encoderfile/build.rs
index 7ecdf96c..016ed527 100644
--- a/encoderfile/build.rs
+++ b/encoderfile/build.rs
@@ -12,14 +12,18 @@ fn main() -> Result<(), Box<dyn std::error::Error>> {
                 "proto/sequence_classification.proto",
                 "proto/token_classification.proto",
                 "proto/sentence_embedding.proto",
+                "proto/image_classification.proto",
                 "proto/manifest.proto",
+                "proto/image_types.proto",
             ],
             &[
                 "proto/embedding",
                 "proto/sequence_classification",
                 "proto/token_classification",
                 "proto/sentence_embedding",
+                "proto/image_classification",
                 "proto/manifest",
+                "proto/image_types",
             ],
         )?;
 
diff --git a/encoderfile/proto/image_classification.proto b/encoderfile/proto/image_classification.proto
new file mode 100644
index 00000000..af028275
--- /dev/null
+++ b/encoderfile/proto/image_classification.proto
@@ -0,0 +1,21 @@
+syntax = "proto3";
+
+package encoderfile.image_classification;
+
+import "proto/metadata.proto";
+import "proto/image_types.proto";
+
+service ImageClassificationInference {
+  rpc Predict(ImageClassificationRequest) returns (ImageClassificationResponse);
+  rpc GetModelMetadata(encoderfile.metadata.GetModelMetadataRequest) returns (encoderfile.metadata.GetModelMetadataResponse);
+}
+
+message ImageClassificationRequest {
+  repeated encoderfile.image_types.ImageInput inputs = 1;
+  map<string, string> metadata = 11;
+}
+
+message ImageClassificationResponse {
+  repeated encoderfile.image_types.ImageLabels labels = 1;
+  map<string, string> metadata = 11;
+}
diff --git a/encoderfile/proto/image_segmentation.proto b/encoderfile/proto/image_segmentation.proto
new file mode 100644
index 00000000..bea6d600
--- /dev/null
+++ b/encoderfile/proto/image_segmentation.proto
@@ -0,0 +1,30 @@
+syntax = "proto3";
+
+package encoderfile.image_segmentation;
+
+import "proto/token.proto";
+import "proto/metadata.proto";
+
+service ImageSegmentation {
+  rpc Predict(ImageSegmentationRequest) returns (ImageSegmentationResponse);
+  rpc GetModelMetadata(encoderfile.metadata.GetModelMetadataRequest) returns (encoderfile.metadata.GetModelMetadataResponse);
+}
+
+message ImageSegmentationRequest {
+  repeated encoderfile.image_types.ImageInput images = 1;
+  map<string, string> metadata = 11;
+}
+
+message ImageSegment {
+  encoderfile.image_types.ImageLabelScore label = 1;
+  bytes mask = 2;
+}
+
+message ImageSegments {
+  repeated ImageSegment segments = 1;
+}
+
+message ImageSegmentationResponse {
+  repeated ImageSegments segments_batch = 1;
+  map<string, string> metadata = 11;
+}
diff --git a/encoderfile/proto/image_types.proto b/encoderfile/proto/image_types.proto
new file mode 100644
index 00000000..ffcd4c3c
--- /dev/null
+++ b/encoderfile/proto/image_types.proto
@@ -0,0 +1,16 @@
+syntax = "proto3";
+
+package encoderfile.image_types;
+
+message ImageInput {
+  bytes image = 1;
+}
+
+message ImageLabelScore {
+  string label = 1;
+  optional float score = 2;
+}
+
+message ImageLabels {
+  repeated ImageLabelScore labels = 1;
+}
diff --git a/encoderfile/proto/metadata.proto b/encoderfile/proto/metadata.proto
index de67f847..25e14f33 100644
--- a/encoderfile/proto/metadata.proto
+++ b/encoderfile/proto/metadata.proto
@@ -6,6 +6,7 @@ message GetModelMetadataRequest {}
 
 message GetModelMetadataResponse {
   string model_id = 1;
+  // TODO decide if we want a model family/area at a higher level
   ModelType model_type = 2;
   map<uint32, string> id2label = 3;
 }
@@ -16,4 +17,8 @@ enum ModelType {
   SEQUENCE_CLASSIFICATION = 2;
   TOKEN_CLASSIFICATION = 3;
   SENTENCE_EMBEDDING = 4;
+
+  IMAGE_CLASSIFICATION = 21;
+  // IMAGE_SEGMENTATION = 22;
+  // OBJECT_DETECTION = 23;
 }
diff --git a/encoderfile/proto/object_detection.proto b/encoderfile/proto/object_detection.proto
new file mode 100644
index 00000000..a55b4d85
--- /dev/null
+++ b/encoderfile/proto/object_detection.proto
@@ -0,0 +1,33 @@
+syntax = "proto3";
+
+package encoderfile.object_detection;
+
+import "proto/token.proto";
+import "proto/metadata.proto";
+
+service ObjectDetection {
+  rpc Predict(ObjectDetectionRequest) returns (ObjectDetectionResponse);
+  rpc GetModelMetadata(encoderfile.metadata.GetModelMetadataRequest) returns (encoderfile.metadata.GetModelMetadataResponse);
+}
+
+message ObjectDetectionRequest {
+  repeated encoderfile.image_types.ImageInput inputs = 1;
+  map<string, string> metadata = 11;
+}
+
+message ImageBoundingBox {
+  encoderfile.image_types.ImageLabelScore label = 1;
+  xmin int32 = 2;
+  xmax int32 = 3;
+  ymin int32 = 4;
+  ymax int32 = 5;
+}
+
+message ImageBoundingBoxes {
+  repeated ImageBoundingBox box = 1;
+}
+
+message ObjectDetectionResponse {
+  repeated ImageBoundingBoxes boxes = 1;
+  map<string, string> metadata = 11;
+}
diff --git a/encoderfile/proto/sentence_embedding.proto b/encoderfile/proto/sentence_embedding.proto
index f7afc989..b14a72a7 100644
--- a/encoderfile/proto/sentence_embedding.proto
+++ b/encoderfile/proto/sentence_embedding.proto
@@ -2,7 +2,6 @@ syntax = "proto3";
 
 package encoderfile.sentence_embedding;
 
-import "proto/token.proto";
 import "proto/metadata.proto";
 
 service SentenceEmbeddingInference {
diff --git a/encoderfile/src/builder/builder.rs b/encoderfile/src/builder/builder.rs
index 00a819ae..f87e236d 100644
--- a/encoderfile/src/builder/builder.rs
+++ b/encoderfile/src/builder/builder.rs
@@ -17,8 +17,10 @@ use crate::{
         codec::EncoderfileCodec,
     },
     generated::manifest::Backend,
+    runtime::{InputType, Input}
 };
 use anyhow::{Context, Result};
+use ort::session::input;
 use serde::{Deserialize, Serialize};
 
 #[derive(Debug, Serialize, Deserialize)]
@@ -27,6 +29,11 @@ pub struct EncoderfileBuilder {
     pub config: BuildConfig,
 }
 
+pub fn validate(input: &Input) -> Result<()> { 
+    Ok(())
+}
+
+
 impl EncoderfileBuilder {
     pub fn new(config: BuildConfig) -> EncoderfileBuilder {
         Self { config }
@@ -90,10 +97,12 @@ impl EncoderfileBuilder {
         }
 
         // validate tokenizer
-        let tokenizer_asset =
-            crate::builder::tokenizer::validate_tokenizer(&self.config.encoderfile)?;
-        planned_assets.push(tokenizer_asset);
-        terminal::success("Tokenizer validated");
+        if self.config.encoderfile.model_type.input_type() == crate::runtime::Input::Text {
+            let tokenizer_asset =
+                crate::builder::tokenizer::validate_tokenizer(&self.config.encoderfile)?;
+            planned_assets.push(tokenizer_asset);
+            terminal::success("Tokenizer validated");
+        }
 
         // initialize final binary
         terminal::info("Writing encoderfile...");
diff --git a/encoderfile/src/builder/config.rs b/encoderfile/src/builder/config.rs
index d57c3b68..b967401e 100644
--- a/encoderfile/src/builder/config.rs
+++ b/encoderfile/src/builder/config.rs
@@ -1,4 +1,6 @@
-use crate::common::{Config as EmbeddedConfig, LuaLibs, ModelConfig, ModelType};
+use crate::common::{Config as EmbeddedConfig, LuaLibs, ModelConfig, model_type::ModelType};
+use crate::runtime::TaskType;
+use crate::runtime::InputType;
 use anyhow::{Context, Result, bail};
 use schemars::JsonSchema;
 use std::string::String;
@@ -24,7 +26,7 @@ pub struct BuildConfig {
     pub encoderfile: EncoderfileConfig,
 }
 
-pub const DEFAULT_VERSION: &str = "0.1.0";
+pub const DEFAULT_VERSION: &str = "0.2.0";
 
 pub const CONFIG_FILE_NOT_FOUND_MSG: &str = "Encoderfile config not found";
 
@@ -271,6 +273,8 @@ pub enum ModelPath {
     },
 }
 
+
+
 impl ModelPath {
     fn resolve(
         &self,
diff --git a/encoderfile/src/builder/model.rs b/encoderfile/src/builder/model.rs
index 77e9cf29..fb12c815 100644
--- a/encoderfile/src/builder/model.rs
+++ b/encoderfile/src/builder/model.rs
@@ -10,7 +10,7 @@ pub trait ModelTypeExt {
     fn validate_model<'a>(&self, path: &'a Path) -> Result<PlannedAsset<'a>>;
 }
 
-impl ModelTypeExt for crate::common::ModelType {
+impl ModelTypeExt for crate::common::model_type::ModelType {
     fn validate_model<'a>(&self, path: &'a Path) -> Result<PlannedAsset<'a>> {
         let model = load_model(path)?;
 
@@ -19,6 +19,7 @@ impl ModelTypeExt for crate::common::ModelType {
             Self::SequenceClassification => validate_sequence_classification_model(model),
             Self::TokenClassification => validate_token_classification_model(model),
             Self::SentenceEmbedding => validate_sentence_embedding_model(model),
+            Self::ImageClassification => validate_image_classification_model(model),
         }?;
 
         PlannedAsset::from_asset_source(AssetSource::File(path), AssetKind::ModelWeights)
@@ -65,6 +66,16 @@ fn validate_token_classification_model(model: Session) -> Result<()> {
     Ok(())
 }
 
+fn validate_image_classification_model(model: Session) -> Result<()> {
+    let shape = get_outp_dim(model.outputs.as_slice(), "logits")?;
+
+    if shape.len() != 2 {
+        bail!("Model must return tensor of shape [batch_size, n_labels]")
+    }
+
+    Ok(())
+}
+
 fn get_outp_dim<'a>(outputs: &'a [Output], outp_name: &str) -> Result<&'a Shape> {
     outputs
         .iter()
diff --git a/encoderfile/src/builder/tokenizer.rs b/encoderfile/src/builder/tokenizer.rs
index cc472a7d..bfabf14a 100644
--- a/encoderfile/src/builder/tokenizer.rs
+++ b/encoderfile/src/builder/tokenizer.rs
@@ -348,7 +348,7 @@ impl<'a> TokenizerConfigBuilder<'a> {
 #[cfg(test)]
 mod tests {
     use crate::builder::config::{ModelPath, TokenizerBuildConfig};
-    use crate::common::ModelType;
+    use crate::common::model_type::ModelType;
 
     use super::*;
 
diff --git a/encoderfile/src/builder/transforms/validation/embedding.rs b/encoderfile/src/builder/transforms/validation/embedding.rs
index 20785c07..83a48784 100644
--- a/encoderfile/src/builder/transforms/validation/embedding.rs
+++ b/encoderfile/src/builder/transforms/validation/embedding.rs
@@ -56,7 +56,7 @@ impl TransformValidatorExt for EmbeddingTransform {
 #[cfg(test)]
 mod tests {
     use crate::builder::config::{EncoderfileConfig, ModelPath};
-    use crate::common::ModelType;
+    use crate::common::model_type::ModelType;
     use crate::transforms::DEFAULT_LIBS;
 
     use super::*;
diff --git a/encoderfile/src/builder/transforms/validation/image_classification.rs b/encoderfile/src/builder/transforms/validation/image_classification.rs
new file mode 100644
index 00000000..1ec5ebab
--- /dev/null
+++ b/encoderfile/src/builder/transforms/validation/image_classification.rs
@@ -0,0 +1,129 @@
+use super::{
+    TransformValidatorExt,
+    utils::{BATCH_SIZE, SEQ_LEN, random_tensor, validation_err, validation_err_ctx},
+};
+use crate::{
+    common::ModelConfig,
+    transforms::{ImageClassificationTransform, Postprocessor},
+};
+use anyhow::{Context, Result};
+
+impl TransformValidatorExt for ImageClassificationTransform {
+    fn dry_run(&self, model_config: &ModelConfig) -> Result<()> {
+        let num_labels = match model_config.num_labels() {
+            Some(n) => n,
+            None => validation_err(
+                "Model config does not have `num_labels`, `id2label`, or `label2id` field. Please make sure you're using an ImageClassification model.",
+            )?,
+        };
+
+        let dummy_logits = random_tensor(&[BATCH_SIZE, SEQ_LEN, num_labels], (-1.0, 1.0))?;
+        let shape = dummy_logits.shape().to_owned();
+
+        let res = self.postprocess(dummy_logits)
+            .with_context(|| {
+                validation_err_ctx(
+                    format!(
+                        "Failed to run postprocessing on dummy logits (randomly generated in range -1.0..1.0) of shape {:?}",
+                        shape.as_slice(),
+                    )
+                )
+            })?;
+
+        // result must return tensor of rank 2
+        if res.ndim() != 2 {
+            validation_err(format!(
+                "Transform must return tensor of rank 2. Got tensor of shape {:?}.",
+                res.shape()
+            ))?
+        }
+
+        // result must have same shape as original
+        if res.shape() != shape {
+            validation_err(format!(
+                "Transform must return Tensor of shape [batch_size, num_labels]. Expected shape [{}, {}], got shape {:?}",
+                BATCH_SIZE,
+                num_labels,
+                res.shape()
+            ))?
+        }
+
+        Ok(())
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use crate::builder::config::{EncoderfileConfig, ModelPath};
+    use crate::common::model_type::ModelType;
+    use crate::transforms::DEFAULT_LIBS;
+
+    use super::*;
+
+    fn test_encoderfile_config() -> EncoderfileConfig {
+        EncoderfileConfig {
+            name: "my-model".to_string(),
+            version: "0.0.1".to_string(),
+            path: ModelPath::Directory(std::path::PathBuf::from("models/image_classification")),
+            model_type: ModelType::ImageClassification,
+            cache_dir: None,
+            output_path: None,
+            transform: None,
+            lua_libs: None,
+            validate_transform: true,
+            tokenizer: None,
+            base_binary_path: None,
+            target: None,
+        }
+    }
+
+    fn test_model_config() -> ModelConfig {
+        let config_json = include_str!("../../../../../models/token_classification/config.json");
+
+        serde_json::from_str(config_json).unwrap()
+    }
+
+    #[test]
+    fn test_identity_validation() {
+        let encoderfile_config = test_encoderfile_config();
+        let model_config = test_model_config();
+
+        ImageClassificationTransform::new(
+            DEFAULT_LIBS.to_vec(),
+            Some("function Postprocess(arr) return arr end".to_string()),
+        )
+        .expect("Failed to create transform")
+        .validate(&encoderfile_config, &model_config)
+        .expect("Failed to validate");
+    }
+
+    #[test]
+    fn test_bad_return_type() {
+        let encoderfile_config = test_encoderfile_config();
+        let model_config = test_model_config();
+
+        let result = ImageClassificationTransform::new(
+            DEFAULT_LIBS.to_vec(),
+            Some("function Postprocess(arr) return 1 end".to_string()),
+        )
+        .expect("Failed to create transform")
+        .validate(&encoderfile_config, &model_config);
+
+        assert!(result.is_err());
+    }
+
+    #[test]
+    fn test_bad_dimensionality() {
+        let encoderfile_config = test_encoderfile_config();
+        let model_config = test_model_config();
+
+        let result = ImageClassificationTransform::new(
+            DEFAULT_LIBS.to_vec(),
+            Some("function Postprocess(arr) return arr:sum_axis(1) end".to_string()),
+        )
+        .expect("Failed to create transform")
+        .validate(&encoderfile_config, &model_config);
+
+        assert!(result.is_err());
+    }
+}
diff --git a/encoderfile/src/builder/transforms/validation/mod.rs b/encoderfile/src/builder/transforms/validation/mod.rs
index 8d1a3783..39089444 100644
--- a/encoderfile/src/builder/transforms/validation/mod.rs
+++ b/encoderfile/src/builder/transforms/validation/mod.rs
@@ -1,5 +1,5 @@
 use crate::{
-    common::{ModelConfig, ModelType},
+    common::{ModelConfig, model_type::ModelType},
     format::assets::{AssetKind, AssetSource, PlannedAsset},
     generated::manifest::LuaLibs as ManifestLuaLibs,
     transforms::{TransformSpec, convert_libs},
@@ -13,6 +13,7 @@ mod embedding;
 mod sentence_embedding;
 mod sequence_classification;
 mod token_classification;
+mod image_classification;
 mod utils;
 
 pub trait TransformValidatorExt: TransformSpec {
@@ -89,6 +90,12 @@ pub fn validate_transform<'a>(
             encoderfile_config,
             model_config
         ),
+        ModelType::ImageClassification => validate_transform!(
+            ImageClassificationTransform,
+            transform_str,
+            encoderfile_config,
+            model_config
+        ),
     }?;
 
     let lua_libs: Option<ManifestLuaLibs> = encoderfile_config
diff --git a/encoderfile/src/builder/transforms/validation/sentence_embedding.rs b/encoderfile/src/builder/transforms/validation/sentence_embedding.rs
index e478927d..22beda8b 100644
--- a/encoderfile/src/builder/transforms/validation/sentence_embedding.rs
+++ b/encoderfile/src/builder/transforms/validation/sentence_embedding.rs
@@ -59,7 +59,7 @@ impl TransformValidatorExt for SentenceEmbeddingTransform {
 #[cfg(test)]
 mod tests {
     use crate::builder::config::{EncoderfileConfig, ModelPath};
-    use crate::common::ModelType;
+    use crate::common::model_type::ModelType;
     use crate::transforms::DEFAULT_LIBS;
 
     use super::*;
diff --git a/encoderfile/src/builder/transforms/validation/sequence_classification.rs b/encoderfile/src/builder/transforms/validation/sequence_classification.rs
index 6c4879dc..50615834 100644
--- a/encoderfile/src/builder/transforms/validation/sequence_classification.rs
+++ b/encoderfile/src/builder/transforms/validation/sequence_classification.rs
@@ -55,7 +55,7 @@ impl TransformValidatorExt for SequenceClassificationTransform {
 #[cfg(test)]
 mod tests {
     use crate::builder::config::{EncoderfileConfig, ModelPath};
-    use crate::common::ModelType;
+    use crate::common::model_type::ModelType;
     use crate::transforms::DEFAULT_LIBS;
 
     use super::*;
diff --git a/encoderfile/src/builder/transforms/validation/token_classification.rs b/encoderfile/src/builder/transforms/validation/token_classification.rs
index 42801a9b..30d2c75e 100644
--- a/encoderfile/src/builder/transforms/validation/token_classification.rs
+++ b/encoderfile/src/builder/transforms/validation/token_classification.rs
@@ -56,7 +56,7 @@ impl TransformValidatorExt for TokenClassificationTransform {
 #[cfg(test)]
 mod tests {
     use crate::builder::config::{EncoderfileConfig, ModelPath};
-    use crate::common::ModelType;
+    use crate::common::model_type::ModelType;
     use crate::transforms::DEFAULT_LIBS;
 
     use super::*;
diff --git a/encoderfile/src/common/image_classification.rs b/encoderfile/src/common/image_classification.rs
new file mode 100644
index 00000000..4eb44e54
--- /dev/null
+++ b/encoderfile/src/common/image_classification.rs
@@ -0,0 +1,113 @@
+use serde::{Deserialize, Serialize};
+use std::{collections::HashMap, io::Read};
+use utoipa::ToSchema;
+use anyhow::Result;
+use crate::common::FromReadInput;
+use image::ImageFormat;
+use bytes::Bytes;
+use crate::transport::http::multipart_openapi::{FromMultipart, MultipartApiError};
+use crate::common::image_types::{ImageInfo, ImageLabelScore};
+
+#[derive(Debug, Serialize, Deserialize)]
+pub struct ImageClassificationRequest {
+    pub images: Vec<ImageInfo>,
+    pub metadata: Option<HashMap<String, String>>,
+}
+
+// FIXME check if we need to reorganize the from*input traits
+impl super::FromCliInput for ImageClassificationRequest {
+    fn from_cli_input(inputs: Vec<String>) -> Self {
+        let images = inputs.into_iter().map(|path| {
+            let image_data = std::fs::read(path).expect("Failed to read image file");
+            let format = image::guess_format(&image_data).expect("Failed to guess image format");
+            ImageInfo {
+                image_bytes: Bytes::from(image_data),
+                image_format: format,
+            }
+        }).collect();
+
+        Self {
+            images,
+            metadata: Some(HashMap::default()),
+        }
+    }
+}
+
+impl FromReadInput for ImageClassificationRequest {
+    fn from_read_input(input: Vec<&mut impl Read>) -> Result<Self> {
+        let images = input.into_iter().map(|reader| {
+            let mut image_data = Vec::new();
+            reader.read_to_end(&mut image_data).map_err(|e| anyhow::anyhow!("Failed to read image data: {}", e))?;
+            let format = image::guess_format(&image_data).map_err(|e| anyhow::anyhow!("Failed to guess image format: {}", e))?;
+            Ok(ImageInfo {
+                image_bytes: Bytes::from(image_data),
+                image_format: format,
+            })
+        }).collect::<Result<Vec<ImageInfo>>>()?;
+
+        Ok(Self {
+            images,
+            metadata: Some(HashMap::default()),
+        })
+    }
+}
+
+impl FromMultipart for ImageClassificationRequest {
+    fn from_multipart(
+        payload: serde_json::Value,
+        attachments: Vec<(Option<String>, Option<String>, bytes::Bytes)>,
+    ) -> Result<Self, MultipartApiError> {
+        let images = attachments
+            .into_iter()
+            .map(|(_file_name, _content_type, image_bytes)| {
+                let format = image::guess_format(&image_bytes)
+                    .map_err(|e| MultipartApiError::RequestConstruction(
+                        format!("Failed to detect image format: {}", e)
+                    ))?;
+                Ok(ImageInfo {
+                    image_bytes,
+                    image_format: format,
+                })
+            })
+            .collect::<Result<Vec<_>, _>>()?;
+
+        let metadata = if payload.is_null() || payload == serde_json::json!({}) {
+            Some(HashMap::default())
+        } else {
+            serde_json::from_value(payload)
+                .ok()
+                .or(Some(HashMap::default()))
+        };
+
+        Ok(Self { images, metadata })
+    }
+}
+
+#[derive(Debug, Serialize, Deserialize, ToSchema, utoipa::ToResponse)]
+pub struct ImageClassificationResponse {
+    pub results: Vec<ImageClassificationResult>,
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub metadata: Option<HashMap<String, String>>,
+}
+
+#[derive(Debug, Serialize, Deserialize, ToSchema, Clone)]
+pub struct ImageClassificationResult {
+    pub labels: Vec<ImageLabelScore>,
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use std::fs::File;
+
+    #[test]
+    fn test_image_classification_request_from_read_input() {
+        let mut file = File::open("../test-pictures/w3c_home.jpg").expect("Failed to open test image");
+        let file_vec = vec![&mut file];
+        let request = ImageClassificationRequest::from_read_input(file_vec).expect("Failed to create request from read input");
+
+        assert_eq!(request.images.len(), 1);
+        assert_eq!(request.images[0].image_format, ImageFormat::Jpeg);
+        assert!(!request.images[0].image_bytes.is_empty());
+    }
+}
diff --git a/encoderfile/src/common/image_types.rs b/encoderfile/src/common/image_types.rs
new file mode 100644
index 00000000..5a0a2040
--- /dev/null
+++ b/encoderfile/src/common/image_types.rs
@@ -0,0 +1,28 @@
+use serde::{Deserialize, Serialize};
+use std::{collections::HashMap, io::Read};
+use utoipa::ToSchema;
+use anyhow::Result;
+use crate::common::FromReadInput;
+use image::ImageFormat;
+use bytes::Bytes;
+use crate::transport::http::multipart_openapi::{FromMultipart, MultipartApiError};
+
+#[derive(Debug, Serialize, Deserialize)]
+pub struct ImageInfo {
+    pub image_bytes: Bytes,
+    pub image_format: ImageFormat,
+}
+
+#[derive(Debug, Serialize, Deserialize, ToSchema, Clone)]
+pub struct ImageLabelScore {
+    pub label: String,
+    pub score: Option<f32>,
+}
+
+
+#[derive(Debug, Serialize, Deserialize, ToSchema, Clone)]
+pub struct ImageLabels {
+    pub labels: Vec<ImageLabelScore>,
+}
+
+
diff --git a/encoderfile/src/common/mod.rs b/encoderfile/src/common/mod.rs
index 56549e37..ea81671d 100644
--- a/encoderfile/src/common/mod.rs
+++ b/encoderfile/src/common/mod.rs
@@ -8,16 +8,30 @@ mod sequence_classification;
 mod token;
 mod token_classification;
 
+// CV
+mod image_classification;
+mod image_types;
+
 pub use config::*;
 pub use embedding::*;
 pub use model_config::*;
 pub use model_metadata::*;
-pub use model_type::ModelType;
 pub use sentence_embedding::*;
 pub use sequence_classification::*;
 pub use token::*;
 pub use token_classification::*;
 
+// CV
+pub use image_classification::*;
+pub use image_types::*;
+use std::io::Read;
+use anyhow::Result;
+
 pub trait FromCliInput {
     fn from_cli_input(inputs: Vec<String>) -> Self;
 }
+
+pub trait FromReadInput {
+    fn from_read_input(input: Vec<&mut impl Read>) -> Result<Self>
+    where Self: Sized;
+}
diff --git a/encoderfile/src/common/model_config.rs b/encoderfile/src/common/model_config.rs
index 89eb4e2d..2e9d08c7 100644
--- a/encoderfile/src/common/model_config.rs
+++ b/encoderfile/src/common/model_config.rs
@@ -4,11 +4,17 @@ use std::collections::HashMap;
 #[derive(Debug, Serialize, Deserialize, Clone)]
 pub struct ModelConfig {
     pub model_type: String,
+    // FIXME to be moved to per-task structs
     pub num_labels: Option<usize>,
     pub id2label: Option<HashMap<u32, String>>,
     pub label2id: Option<HashMap<String, u32>>,
+    pub height: Option<u32>,
+    pub width: Option<u32>,
+    pub image_size: Option<u32>,
+    pub num_channels: Option<u32>,
 }
 
+// TODO add image handling metadata
 impl ModelConfig {
     pub fn id2label(&self, id: u32) -> Option<&str> {
         self.id2label.as_ref()?.get(&id).map(|s| s.as_str())
@@ -19,13 +25,13 @@ impl ModelConfig {
     }
 
     pub fn num_labels(&self) -> Option<usize> {
-        if self.num_labels.is_some() {
-            return self.num_labels;
+        if let Some(num_labels) = self.num_labels {
+            return Some(num_labels);
         }
 
         if let Some(id2label) = &self.id2label {
             return Some(id2label.len());
-        }
+            }
 
         if let Some(label2id) = &self.label2id {
             return Some(label2id.len());
@@ -33,6 +39,17 @@ impl ModelConfig {
 
         None
     }
+    pub fn height(&self) -> Option<u32> {
+        self.height.or(self.image_size)
+    }
+
+    pub fn width(&self) -> Option<u32> {
+        self.width.or(self.image_size)
+    }
+
+    pub fn num_channels(&self) -> Option<u32> {
+        self.num_channels
+    }
 }
 
 #[cfg(test)]
@@ -58,6 +75,10 @@ mod tests {
             num_labels: Some(3),
             id2label: Some(id2label.clone()),
             label2id: Some(label2id.clone()),
+            height: None,
+            width: None,
+            image_size: None,
+            num_channels: None,
         };
 
         assert_eq!(config.num_labels(), Some(3));
@@ -67,6 +88,10 @@ mod tests {
             num_labels: None,
             id2label: Some(id2label.clone()),
             label2id: Some(label2id.clone()),
+            height: None,
+            width: None,
+            image_size: None,
+            num_channels: None,
         };
 
         assert_eq!(config.num_labels(), Some(3));
@@ -76,6 +101,10 @@ mod tests {
             num_labels: None,
             id2label: None,
             label2id: Some(label2id.clone()),
+            height: None,
+            width: None,
+            image_size: None,
+            num_channels: None,
         };
 
         assert_eq!(config.num_labels(), Some(3));
diff --git a/encoderfile/src/common/model_type.rs b/encoderfile/src/common/model_type.rs
index 96cc7d3e..26a28880 100644
--- a/encoderfile/src/common/model_type.rs
+++ b/encoderfile/src/common/model_type.rs
@@ -1,5 +1,9 @@
 macro_rules! model_type {
     [ $( $x:ident ),* $(,)? ] => {
+        pub trait ModelTypeSpec: Send + Sync + Clone + std::fmt::Debug + 'static {
+        fn enum_val() -> ModelType;
+        }
+
         // create enum
         #[derive(Debug, Clone, PartialEq, Eq, serde::Serialize, serde::Deserialize, utoipa::ToSchema, schemars::JsonSchema)]
         #[serde(rename_all = "snake_case")]
@@ -38,6 +42,7 @@ macro_rules! model_type {
                 }
             }
         )*
+
     }
 }
 
@@ -46,8 +51,5 @@ model_type![
     SequenceClassification,
     TokenClassification,
     SentenceEmbedding,
+    ImageClassification
 ];
-
-pub trait ModelTypeSpec: Send + Sync + Clone + std::fmt::Debug + 'static {
-    fn enum_val() -> ModelType;
-}
diff --git a/encoderfile/src/dev_utils/mod.rs b/encoderfile/src/dev_utils/mod.rs
index 6f9a371a..9eefeecd 100644
--- a/encoderfile/src/dev_utils/mod.rs
+++ b/encoderfile/src/dev_utils/mod.rs
@@ -1,9 +1,18 @@
 use crate::{
     common::{
-        Config, ModelConfig, TokenizerConfig,
+        Config, TokenizerConfig,
         model_type::{self, ModelTypeSpec},
     },
-    runtime::{AppState, EncoderfileState},
+    runtime::{
+        AppState,
+        EncoderfileState,
+        FeatureExtractorState,
+        ClassifierState,
+        TextInputState,
+        ImageInputState,
+        InputType,
+        TaskType,
+    },
 };
 use ort::session::Session;
 use parking_lot::Mutex;
@@ -11,10 +20,12 @@ use std::str::FromStr;
 use std::{fs::File, io::BufReader};
 
 const EMBEDDING_DIR: &str = "../models/embedding";
+// CHECK sentence embedding????
 const SEQUENCE_CLASSIFICATION_DIR: &str = "../models/sequence_classification";
 const TOKEN_CLASSIFICATION_DIR: &str = "../models/token_classification";
 
-pub fn get_state<T: ModelTypeSpec>(dir: &str) -> AppState<T> {
+pub fn get_state<T: ModelTypeSpec + InputTypeFromFile + TaskTypeFromFile>(dir: &str) -> AppState<T>
+{
     let config = Config {
         name: "my-model".to_string(),
         version: "0.0.1".to_string(),
@@ -23,37 +34,114 @@ pub fn get_state<T: ModelTypeSpec>(dir: &str) -> AppState<T> {
         lua_libs: None,
     };
 
-    let model_config = get_model_config(dir);
-    let tokenizer = get_tokenizer(dir);
     let session = get_model(dir);
 
-    EncoderfileState::new(config, session, tokenizer, model_config).into()
+    EncoderfileState::new(
+        config,
+        session,
+        T::get_input_state(dir),
+        T::get_task_state(dir),
+    ).into()
 }
 
-pub fn embedding_state() -> AppState<model_type::Embedding> {
-    get_state(EMBEDDING_DIR)
+pub trait TaskTypeFromFile: TaskType {
+    fn get_task_state(dir: &str) -> Self::TaskState;
 }
 
-pub fn sentence_embedding_state() -> AppState<model_type::SentenceEmbedding> {
-    get_state(EMBEDDING_DIR)
+pub trait InputTypeFromFile: InputType {
+    fn get_input_state(dir: &str) -> Self::InputState;
 }
 
-pub fn sequence_classification_state() -> AppState<model_type::SequenceClassification> {
-    get_state(SEQUENCE_CLASSIFICATION_DIR)
+pub fn get_reader(dir: &str) -> BufReader<File> {
+    let file = File::open(format!("{}/{}", dir, "config.json")).expect("Config not found");
+    BufReader::new(file)
 }
 
-pub fn token_classification_state() -> AppState<model_type::TokenClassification> {
-    get_state(TOKEN_CLASSIFICATION_DIR)
+// Input types
+fn get_text_input_state(dir: &str) -> TextInputState {
+    let reader = get_reader(dir);
+    let tokenizer = get_tokenizer(dir);
+    let model_config = serde_json::from_reader(reader).expect("Invalid model config");
+
+    TextInputState { tokenizer, model_config }
 }
 
-fn get_model_config(dir: &str) -> ModelConfig {
-    let file = File::open(format!("{}/{}", dir, "config.json")).expect("Config not found");
-    let reader = BufReader::new(file);
+fn get_image_input_state(dir: &str) -> ImageInputState {
+    let reader = get_reader(dir);
+    let incomplete_state: ImageInputState = serde_json::from_reader(reader).expect("Invalid model config");
+    ImageInputState {
+        num_channels: incomplete_state.num_channels,
+        height: incomplete_state.height.or(incomplete_state.image_size),
+        width: incomplete_state.width.or(incomplete_state.image_size),
+        image_size: incomplete_state.image_size,
+    }
+}
+
+macro_rules! input_state_impl {
+    ($model_type:ty, $state_fun:ident) => {
+        impl InputTypeFromFile for $model_type {
+            fn get_input_state(dir: &str) -> Self::InputState {
+                $state_fun(dir)
+            }
+        }
+    };
+}
 
-    // Deserialize into struct
+input_state_impl!(model_type::SequenceClassification, get_text_input_state);
+input_state_impl!(model_type::TokenClassification, get_text_input_state);
+input_state_impl!(model_type::ImageClassification, get_image_input_state);
+input_state_impl!(model_type::Embedding, get_text_input_state);
+input_state_impl!(model_type::SentenceEmbedding, get_text_input_state);
+
+
+// Task types
+fn get_class_task_state(dir: &str) -> ClassifierState {
+    let reader = get_reader(dir);
     serde_json::from_reader(reader).expect("Invalid model config")
 }
 
+fn get_feature_task_state(_dir: &str) -> FeatureExtractorState {
+    FeatureExtractorState {}
+}
+
+macro_rules! task_state_impl {
+    ($model_type:ty, $state_fun:ident) => {
+        impl TaskTypeFromFile for $model_type {
+            fn get_task_state(dir: &str) -> Self::TaskState {
+                $state_fun(dir)
+            }
+        }
+    };
+}
+
+task_state_impl!(model_type::SequenceClassification, get_class_task_state);
+task_state_impl!(model_type::TokenClassification, get_class_task_state);
+task_state_impl!(model_type::ImageClassification, get_class_task_state);
+task_state_impl!(model_type::Embedding, get_feature_task_state);
+task_state_impl!(model_type::SentenceEmbedding, get_feature_task_state);
+
+
+
+pub fn embedding_state() -> AppState<model_type::Embedding>
+{
+    get_state(EMBEDDING_DIR)
+}
+
+pub fn sentence_embedding_state() -> AppState<model_type::SentenceEmbedding>
+{
+    get_state(EMBEDDING_DIR)
+}
+
+pub fn sequence_classification_state() -> AppState<model_type::SequenceClassification>
+{
+    get_state(SEQUENCE_CLASSIFICATION_DIR)
+}
+
+pub fn token_classification_state() -> AppState<model_type::TokenClassification>
+{
+    get_state(TOKEN_CLASSIFICATION_DIR)
+}
+
 fn get_tokenizer(dir: &str) -> crate::runtime::TokenizerService {
     let tokenizer_str = std::fs::read_to_string(format!("{}/{}", dir, "tokenizer.json"))
         .expect("Tokenizer json not found");
diff --git a/encoderfile/src/format/assets/kind.rs b/encoderfile/src/format/assets/kind.rs
index d7a12f1a..9ea67f32 100644
--- a/encoderfile/src/format/assets/kind.rs
+++ b/encoderfile/src/format/assets/kind.rs
@@ -1,4 +1,4 @@
-use crate::common::model_type::ModelTypeSpec;
+use crate::{common::model_type::ModelTypeSpec, runtime::{Input, InputType, Task, TaskType}};
 
 /// Identifies the semantic role of an embedded artifact.
 ///
@@ -50,27 +50,43 @@ impl AssetKind {
     ];
 }
 
-pub trait AssetPolicySpec: ModelTypeSpec {
-    fn required_assets() -> &'static [AssetKind];
-    fn optional_assets() -> &'static [AssetKind];
+pub trait AssetPolicySpec: ModelTypeSpec + InputType + TaskType {
+    fn required_assets() -> &'static [AssetKind] {
+        match (Self::input_type(), Self::task_type()) {
+            (Input::Text, Task::Classification) => &[
+                AssetKind::ModelWeights,
+                AssetKind::ModelConfig,
+                AssetKind::Tokenizer,
+            ],
+            (Input::Text, Task::FeatureExtraction) => &[
+                AssetKind::ModelWeights,
+                AssetKind::ModelConfig,
+                AssetKind::Tokenizer,
+            ],
+            (Input::Image, Task::Classification) => &[
+                AssetKind::ModelWeights,
+                AssetKind::ModelConfig,
+            ],
+            (Input::Image, Task::FeatureExtraction) => &[
+                AssetKind::ModelWeights,
+                AssetKind::ModelConfig,
+            ],
+        }
+    }
+    fn optional_assets() -> &'static [AssetKind] {
+        match (Self::input_type(), Self::task_type()) {
+            (Input::Text, Task::Classification) => &[AssetKind::Transform],
+            (Input::Text, Task::FeatureExtraction) => &[AssetKind::Transform],
+            (Input::Image, Task::Classification) => &[AssetKind::Transform],
+            (Input::Image, Task::FeatureExtraction) => &[AssetKind::Transform],
+        }
+    }
 }
 
 macro_rules! asset_policy_spec {
     // Huggingface-style encoders
     (Encoder, $model_type:ident) => {
-        impl AssetPolicySpec for crate::common::model_type::$model_type {
-            fn required_assets() -> &'static [AssetKind] {
-                &[
-                    AssetKind::ModelWeights,
-                    AssetKind::ModelConfig,
-                    AssetKind::Tokenizer,
-                ]
-            }
-
-            fn optional_assets() -> &'static [AssetKind] {
-                &[AssetKind::Transform]
-            }
-        }
+        impl AssetPolicySpec for crate::common::model_type::$model_type {}
     };
 }
 
@@ -78,3 +94,4 @@ asset_policy_spec!(Encoder, Embedding);
 asset_policy_spec!(Encoder, SequenceClassification);
 asset_policy_spec!(Encoder, TokenClassification);
 asset_policy_spec!(Encoder, SentenceEmbedding);
+asset_policy_spec!(Encoder, ImageClassification);
diff --git a/encoderfile/src/format/codec/encoder.rs b/encoderfile/src/format/codec/encoder.rs
index 6972c2c7..96c7ab11 100644
--- a/encoderfile/src/format/codec/encoder.rs
+++ b/encoderfile/src/format/codec/encoder.rs
@@ -3,13 +3,13 @@ use anyhow::{Result, bail};
 
 use crate::{
     common::model_type::{
-        Embedding, ModelType, SentenceEmbedding, SequenceClassification, TokenClassification,
+        Embedding, ImageClassification, ModelType, SentenceEmbedding, SequenceClassification, TokenClassification,
     },
     format::{
         assets::{AssetPlan, AssetPolicySpec},
         footer::EncoderfileFooter,
     },
-    generated::manifest::{Artifact, Backend, EncoderfileManifest},
+    generated::manifest::{Artifact, Backend, EncoderfileManifest}, runtime::InputType,
 };
 
 use prost::Message;
@@ -86,6 +86,7 @@ impl EncoderfileCodec {
             }
             ModelType::TokenClassification => Self::validate_assets::<TokenClassification>(plan)?,
             ModelType::SentenceEmbedding => Self::validate_assets::<SentenceEmbedding>(plan)?,
+            ModelType::ImageClassification => Self::validate_assets::<ImageClassification>(plan)?,
         };
 
         let model_type: crate::generated::metadata::ModelType = model_type.into();
diff --git a/encoderfile/src/format/container.rs b/encoderfile/src/format/container.rs
index 6bd5522e..496dad49 100644
--- a/encoderfile/src/format/container.rs
+++ b/encoderfile/src/format/container.rs
@@ -2,7 +2,7 @@ use anyhow::Result;
 use std::io::{Read, Seek, SeekFrom};
 
 use crate::{
-    common::ModelType,
+    common::model_type::ModelType,
     format::{assets::AssetKind, footer::EncoderfileFooter},
     generated::manifest::{Artifact, EncoderfileManifest},
 };
diff --git a/encoderfile/src/generated/image_classification.rs b/encoderfile/src/generated/image_classification.rs
new file mode 100644
index 00000000..bedfde9c
--- /dev/null
+++ b/encoderfile/src/generated/image_classification.rs
@@ -0,0 +1,35 @@
+use crate::{common, generated::image_types::ImageLabels};
+
+tonic::include_proto!("encoderfile.image_classification");
+
+impl From<ImageClassificationRequest> for common::ImageClassificationRequest {
+    fn from(val: ImageClassificationRequest) -> Self {
+        let images = val.inputs.into_iter().map(|input| {
+            common::ImageInfo {
+                image_bytes: bytes::Bytes::from(input.image),
+                image_format: image::ImageFormat::Png, // TODO: detect format properly
+            }
+        }).collect();
+        Self {
+            images,
+            metadata: if val.metadata.is_empty() { None } else { Some(val.metadata) },
+        }
+    }
+}
+
+impl From<common::ImageClassificationResponse> for ImageClassificationResponse {
+    fn from(val: common::ImageClassificationResponse) -> Self {
+        Self {
+            labels: val.results.into_iter().map(|result| result.into()).collect(),
+            metadata: val.metadata.unwrap_or_default(),
+        }
+    }
+}
+
+impl From<common::ImageClassificationResult> for ImageLabels {
+    fn from(val: common::ImageClassificationResult) -> Self {
+        ImageLabels {
+            labels: val.labels.into_iter().map(|label| label.into()).collect(),
+        }
+    }
+}
diff --git a/encoderfile/src/generated/image_types.rs b/encoderfile/src/generated/image_types.rs
new file mode 100644
index 00000000..d8b9a452
--- /dev/null
+++ b/encoderfile/src/generated/image_types.rs
@@ -0,0 +1,28 @@
+use crate::common;
+
+tonic::include_proto!("encoderfile.image_types");
+
+impl From<common::ImageInfo> for ImageInput {
+    fn from(val: common::ImageInfo) -> Self {
+        ImageInput {
+            image: val.image_bytes.to_vec(),
+        }
+    }
+}
+
+impl From<common::ImageLabelScore> for ImageLabelScore {
+    fn from(val: common::ImageLabelScore) -> Self {
+        ImageLabelScore {
+            label: val.label,
+            score: val.score,
+        }
+    }
+}
+    
+impl From<common::ImageLabels> for ImageLabels {
+    fn from(val: common::ImageLabels) -> Self {
+        ImageLabels {
+            labels: val.labels.into_iter().map(|label| label.into()).collect(),
+        }
+    }
+}
diff --git a/encoderfile/src/generated/metadata.rs b/encoderfile/src/generated/metadata.rs
index 33a660a4..e7d68479 100644
--- a/encoderfile/src/generated/metadata.rs
+++ b/encoderfile/src/generated/metadata.rs
@@ -12,24 +12,26 @@ impl From<common::GetModelMetadataResponse> for GetModelMetadataResponse {
     }
 }
 
-impl From<common::ModelType> for ModelType {
-    fn from(val: common::ModelType) -> Self {
+impl From<common::model_type::ModelType> for ModelType {
+    fn from(val: common::model_type::ModelType) -> Self {
         match val {
-            common::ModelType::Embedding => Self::Embedding,
-            common::ModelType::SequenceClassification => Self::SequenceClassification,
-            common::ModelType::TokenClassification => Self::TokenClassification,
-            common::ModelType::SentenceEmbedding => Self::SentenceEmbedding,
+            common::model_type::ModelType::Embedding => Self::Embedding,
+            common::model_type::ModelType::SequenceClassification => Self::SequenceClassification,
+            common::model_type::ModelType::TokenClassification => Self::TokenClassification,
+            common::model_type::ModelType::SentenceEmbedding => Self::SentenceEmbedding,
+            common::model_type::ModelType::ImageClassification => Self::ImageClassification,
         }
     }
 }
 
-impl From<ModelType> for common::ModelType {
+impl From<ModelType> for common::model_type::ModelType {
     fn from(val: ModelType) -> Self {
         match val {
-            ModelType::Embedding => common::ModelType::Embedding,
-            ModelType::SequenceClassification => common::ModelType::SequenceClassification,
-            ModelType::TokenClassification => common::ModelType::TokenClassification,
-            ModelType::SentenceEmbedding => common::ModelType::SentenceEmbedding,
+            ModelType::Embedding => common::model_type::ModelType::Embedding,
+            ModelType::SequenceClassification => common::model_type::ModelType::SequenceClassification,
+            ModelType::TokenClassification => common::model_type::ModelType::TokenClassification,
+            ModelType::SentenceEmbedding => common::model_type::ModelType::SentenceEmbedding,
+            ModelType::ImageClassification => common::model_type::ModelType::ImageClassification,
             ModelType::Unspecified => {
                 unreachable!("Unspecified model type. This should not happen.")
             }
diff --git a/encoderfile/src/generated/mod.rs b/encoderfile/src/generated/mod.rs
index 79d1fbe4..e617876e 100644
--- a/encoderfile/src/generated/mod.rs
+++ b/encoderfile/src/generated/mod.rs
@@ -5,3 +5,5 @@ pub mod sentence_embedding;
 pub mod sequence_classification;
 pub mod token;
 pub mod token_classification;
+pub mod image_classification;
+pub mod image_types;
diff --git a/encoderfile/src/inference/embedding.rs b/encoderfile/src/inference/embedding.rs
index af125053..9aa062c8 100644
--- a/encoderfile/src/inference/embedding.rs
+++ b/encoderfile/src/inference/embedding.rs
@@ -13,7 +13,7 @@ pub fn embedding<'a>(
     transform: &EmbeddingTransform,
     encodings: Vec<Encoding>,
 ) -> Result<Vec<TokenEmbeddingSequence>, ApiError> {
-    let (a_ids, a_mask, a_type_ids) = crate::prepare_inputs!(encodings);
+    let (a_ids, a_mask, a_type_ids) = crate::prepare_text_inputs!(encodings);
 
     let mut outputs = crate::run_model!(session, a_ids, a_mask, a_type_ids)?
         .get("last_hidden_state")
diff --git a/encoderfile/src/inference/image_classification.rs b/encoderfile/src/inference/image_classification.rs
new file mode 100644
index 00000000..fc6523b7
--- /dev/null
+++ b/encoderfile/src/inference/image_classification.rs
@@ -0,0 +1,64 @@
+use std::os::raw;
+
+use ndarray::{Array2, Array4, Ix2, Axis, s};
+
+use crate::{
+    error::ApiError,
+};
+
+use crate::common::{ImageLabelScore};
+
+fn logit_to_prob(logit: f32) -> f32 {
+    1.0 / (1.0 + (-logit).exp())
+}
+
+#[tracing::instrument(skip_all)]
+pub fn image_classification<'a>(
+    mut session: crate::runtime::Model<'a>,
+    // CHECK if this is a vec of flattened rgb images with num_channels X height X width
+    images: Array4<f32>,
+    classes: Vec<String>,
+) -> Result<Vec<Vec<ImageLabelScore>>, ApiError> {
+    let grouped_images = ort::value::TensorRef::from_array_view(
+        &images)
+        .unwrap()
+        .to_owned();
+    let raw_outputs = crate::run_cv_model!(session, grouped_images)?;
+    println!("Raw outputs: {:?}", raw_outputs.keys().collect::<Vec<_>>());
+    let mut outputs = raw_outputs
+        .get("logits")
+        .expect("Model does not return logits")
+        .try_extract_array::<f32>()
+        .expect("Model does not return tensor extractable to f32")
+        .into_dimensionality::<Ix2>()
+        .expect("Model does not return tensor of shape [n_batch, n_classes]")
+        .into_owned();
+    println!("Model outputs: {:?}", outputs);
+    outputs.mapv_inplace(logit_to_prob);
+    println!("Model outputs: {:?}", outputs);
+
+    Ok(postprocess(outputs, classes))
+}
+
+#[tracing::instrument(skip_all)]
+pub fn postprocess(outputs: Array2<f32>, classes: Vec<String>) -> Vec<Vec<ImageLabelScore>> {
+    outputs
+        .axis_iter(Axis(0))
+        .map(|logs| {
+            logs.iter().enumerate()
+                .map(|(idx, score)| {
+                        ImageLabelScore {
+                            label: classes[idx].to_string(), // TODO: get label from config
+                            score: Some(*score)
+                        }
+                    }
+                )
+                .collect()
+        })
+        .collect()
+}
+
+#[cfg(test)]
+mod tests {
+    // Add your test cases here
+}
\ No newline at end of file
diff --git a/encoderfile/src/inference/mod.rs b/encoderfile/src/inference/mod.rs
index 09803536..e9b82a92 100644
--- a/encoderfile/src/inference/mod.rs
+++ b/encoderfile/src/inference/mod.rs
@@ -1,5 +1,8 @@
+// text
 pub mod embedding;
 pub mod sentence_embedding;
 pub mod sequence_classification;
 pub mod token_classification;
+// cv
+pub mod image_classification;
 pub mod utils;
diff --git a/encoderfile/src/inference/sentence_embedding.rs b/encoderfile/src/inference/sentence_embedding.rs
index ea0e3051..d2a876af 100644
--- a/encoderfile/src/inference/sentence_embedding.rs
+++ b/encoderfile/src/inference/sentence_embedding.rs
@@ -13,7 +13,7 @@ pub fn sentence_embedding<'a>(
     transform: &SentenceEmbeddingTransform,
     encodings: Vec<Encoding>,
 ) -> Result<Vec<SentenceEmbedding>, ApiError> {
-    let (a_ids, a_mask, a_type_ids) = crate::prepare_inputs!(encodings);
+    let (a_ids, a_mask, a_type_ids) = crate::prepare_text_inputs!(encodings);
 
     let a_mask_arr = a_mask
         .try_extract_array::<i64>()
diff --git a/encoderfile/src/inference/sequence_classification.rs b/encoderfile/src/inference/sequence_classification.rs
index f003a07e..1a37a3f7 100644
--- a/encoderfile/src/inference/sequence_classification.rs
+++ b/encoderfile/src/inference/sequence_classification.rs
@@ -1,7 +1,5 @@
 use crate::{
-    common::{ModelConfig, SequenceClassificationResult},
-    error::ApiError,
-    transforms::{Postprocessor, SequenceClassificationTransform},
+    common::{ModelConfig, SequenceClassificationResult}, error::ApiError, runtime::ClassifierState, transforms::{Postprocessor, SequenceClassificationTransform}
 };
 use ndarray::{Array2, Axis, Ix2};
 use ndarray_stats::QuantileExt;
@@ -11,10 +9,10 @@ use tokenizers::Encoding;
 pub fn sequence_classification<'a>(
     mut session: crate::runtime::Model<'a>,
     transform: &SequenceClassificationTransform,
-    config: &ModelConfig,
+    config: &ClassifierState,
     encodings: Vec<Encoding>,
 ) -> Result<Vec<SequenceClassificationResult>, ApiError> {
-    let (a_ids, a_mask, a_type_ids) = crate::prepare_inputs!(encodings);
+    let (a_ids, a_mask, a_type_ids) = crate::prepare_text_inputs!(encodings);
 
     let mut outputs = crate::run_model!(session, a_ids, a_mask, a_type_ids)?
         .get("logits")
@@ -35,7 +33,7 @@ pub fn sequence_classification<'a>(
 #[tracing::instrument(skip_all)]
 pub fn postprocess(
     outputs: Array2<f32>,
-    config: &ModelConfig,
+    config: &ClassifierState,
 ) -> Vec<SequenceClassificationResult> {
     outputs
         .axis_iter(Axis(0))
diff --git a/encoderfile/src/inference/token_classification.rs b/encoderfile/src/inference/token_classification.rs
index 732073f0..3d5181fa 100644
--- a/encoderfile/src/inference/token_classification.rs
+++ b/encoderfile/src/inference/token_classification.rs
@@ -1,7 +1,5 @@
 use crate::{
-    common::{ModelConfig, TokenClassification, TokenClassificationResult, TokenInfo},
-    error::ApiError,
-    transforms::{Postprocessor, TokenClassificationTransform},
+    common::{ModelConfig, TokenClassification, TokenClassificationResult, TokenInfo}, error::ApiError, runtime::ClassifierState, transforms::{Postprocessor, TokenClassificationTransform}
 };
 use ndarray::{Array3, Axis, Ix3};
 use ndarray_stats::QuantileExt;
@@ -11,10 +9,10 @@ use tokenizers::Encoding;
 pub fn token_classification<'a>(
     mut session: crate::runtime::Model<'a>,
     transform: &TokenClassificationTransform,
-    config: &ModelConfig,
+    config: &ClassifierState,
     encodings: Vec<Encoding>,
 ) -> Result<Vec<TokenClassificationResult>, ApiError> {
-    let (a_ids, a_mask, a_type_ids) = crate::prepare_inputs!(encodings);
+    let (a_ids, a_mask, a_type_ids) = crate::prepare_text_inputs!(encodings);
 
     let mut outputs = crate::run_model!(session, a_ids, a_mask, a_type_ids)?
         .get("logits")
@@ -36,7 +34,7 @@ pub fn token_classification<'a>(
 pub fn postprocess(
     outputs: Array3<f32>,
     encodings: Vec<Encoding>,
-    config: &ModelConfig,
+    config: &ClassifierState,
 ) -> Vec<TokenClassificationResult> {
     let mut predictions = Vec::new();
 
diff --git a/encoderfile/src/inference/utils.rs b/encoderfile/src/inference/utils.rs
index a59f1f62..58f27075 100644
--- a/encoderfile/src/inference/utils.rs
+++ b/encoderfile/src/inference/utils.rs
@@ -3,7 +3,7 @@ use ort::session::Session;
 use parking_lot::MutexGuard;
 
 #[macro_export]
-macro_rules! prepare_inputs {
+macro_rules! prepare_text_inputs {
     ($encodings:ident) => {{
         let padded_token_length = $encodings[0].len();
 
@@ -75,3 +75,14 @@ macro_rules! run_model {
         })
     }};
 }
+
+#[macro_export]
+macro_rules! run_cv_model {
+    ($session:expr, $image_bytes:expr) => {{
+        $session.run(ort::inputs!($image_bytes))
+        .map_err(|e| {
+            tracing::error!("Error running model: {:?}", e);
+            $crate::error::ApiError::InternalError("Error running model")
+        })
+    }};
+}
diff --git a/encoderfile/src/runtime/loader.rs b/encoderfile/src/runtime/loader.rs
index b00959c4..92d2278c 100644
--- a/encoderfile/src/runtime/loader.rs
+++ b/encoderfile/src/runtime/loader.rs
@@ -5,7 +5,7 @@ use std::io::{Read, Seek};
 use ort::session::Session;
 
 use crate::{
-    common::{Config, LuaLibs, ModelConfig, ModelType},
+    common::{Config, LuaLibs, ModelConfig, model_type::ModelType},
     format::{assets::AssetKind, codec::EncoderfileCodec, container::Encoderfile},
     generated::manifest::{self, TransformType},
     runtime::TokenizerService,
diff --git a/encoderfile/src/runtime/mod.rs b/encoderfile/src/runtime/mod.rs
index 41d2bf86..57ae81c1 100644
--- a/encoderfile/src/runtime/mod.rs
+++ b/encoderfile/src/runtime/mod.rs
@@ -5,8 +5,22 @@ mod loader;
 mod state;
 mod tokenizer;
 
-pub use loader::{EncoderfileLoader, load_assets};
-pub use state::{AppState, EncoderfileState};
+pub use loader::{
+    EncoderfileLoader,
+    load_assets,
+};
+pub use state::{
+    AppState,
+    EncoderfileState,
+    Input,
+    Task,
+    InputType,
+    TaskType,
+    ClassifierState,
+    FeatureExtractorState,
+    ImageInputState,
+    TextInputState,
+};
 pub use tokenizer::TokenizerService;
 
 pub type Model<'a> = MutexGuard<'a, Session>;
diff --git a/encoderfile/src/runtime/state.rs b/encoderfile/src/runtime/state.rs
index 5690d99e..0010be37 100644
--- a/encoderfile/src/runtime/state.rs
+++ b/encoderfile/src/runtime/state.rs
@@ -1,32 +1,170 @@
 use std::{marker::PhantomData, sync::Arc};
+use serde::{Deserialize, Serialize};
 
 use ort::session::Session;
 use parking_lot::Mutex;
 
 use crate::{
-    common::{Config, ModelConfig, ModelType, model_type::ModelTypeSpec},
-    runtime::TokenizerService,
-    transforms::DEFAULT_LIBS,
+    common::{Config, ModelConfig, model_type::{ModelType, ModelTypeSpec, self}}, runtime::TokenizerService, transforms::DEFAULT_LIBS
 };
 
 pub type AppState<T> = Arc<EncoderfileState<T>>;
 
+#[derive(PartialEq)]
+pub enum Task {
+    Classification,
+    FeatureExtraction,
+}
+
+#[derive(PartialEq)]
+pub enum Input {
+    Text,
+    Image,
+}
+
+pub trait TaskType {
+    const TASK: Task;
+    fn task_type_val(&self) -> Task {
+        Self::task_type()
+    }
+    fn task_type() -> Task {
+        Self::TASK
+    }
+    type TaskState;
+}
+
+pub trait InputType {
+    const INPUT: Input;
+    fn input_type_val(&self) -> Input {
+        Self::input_type()
+    }
+    fn input_type() -> Input {
+        Self::INPUT
+    }
+    type InputState;
+}
+
+pub struct TextInputState {
+    pub tokenizer: TokenizerService,
+    pub model_config: ModelConfig,
+}
+#[derive(Debug, Serialize, Deserialize, Clone)]
+pub struct ImageInputState {
+    pub num_channels: u32,
+    pub height: Option<u32>,
+    pub width: Option<u32>,
+    pub image_size: Option<u32>,
+}
+
+#[derive(Debug, Serialize, Deserialize, Clone)]
+pub struct ClassifierState {
+    pub id2label: Option<std::collections::HashMap<u32, String>>,
+    pub label2id: Option<std::collections::HashMap<String, u32>>,
+    pub num_labels: Option<usize>,
+}
+impl ClassifierState {
+    pub fn id2label(&self, id: u32) -> Option<&str> {
+        self.id2label.as_ref()?.get(&id).map(|s| s.as_str())
+    }
+
+    pub fn label2id(&self, label: &str) -> Option<u32> {
+        self.label2id.as_ref()?.get(label).copied()
+    }
+
+    pub fn num_labels(&self) -> Option<usize> {
+        if self.num_labels.is_some() {
+            return self.num_labels;
+        }
+
+        if let Some(id2label) = &self.id2label {
+            return Some(id2label.len());
+        }
+
+        if let Some(label2id) = &self.label2id {
+            return Some(label2id.len());
+        }
+
+        None
+    }
+}
+
+#[derive(Debug, Serialize, Deserialize, Clone)]
+pub struct FeatureExtractorState {}
+
+macro_rules! input_state_impl {
+    ($model_type:ty, $state_type:ty, $input:expr) => {
+        impl InputType for $model_type {
+            const INPUT: Input = $input;
+            type InputState = $state_type;
+        }
+    };
+}
+
+input_state_impl!(model_type::Embedding, TextInputState, Input::Text);
+input_state_impl!(model_type::SentenceEmbedding, TextInputState, Input::Text);
+input_state_impl!(model_type::SequenceClassification, TextInputState, Input::Text);
+input_state_impl!(model_type::TokenClassification, TextInputState, Input::Text);
+input_state_impl!(model_type::ImageClassification, ImageInputState, Input::Image);
+
+macro_rules! task_state_impl {
+    ($model_type:ty, $state_type:ty, $task:expr) => {
+        impl TaskType for $model_type {
+            const TASK: Task = $task;
+            type TaskState = $state_type;
+        }
+    };
+}
+
+task_state_impl!(model_type::SequenceClassification, ClassifierState, Task::Classification);
+task_state_impl!(model_type::TokenClassification, ClassifierState, Task::Classification);
+task_state_impl!(model_type::ImageClassification, ClassifierState, Task::Classification);
+task_state_impl!(model_type::Embedding, FeatureExtractorState, Task::FeatureExtraction);
+task_state_impl!(model_type::SentenceEmbedding, FeatureExtractorState, Task::FeatureExtraction);
+
+macro_rules! input_type_impl {
+    [ $( $x:ident ),* $(,)? ] => {
+        impl ModelType {
+            pub fn input_type(&self) -> crate::runtime::Input {
+                match self {
+                    $(
+                        ModelType::$x => model_type::$x::input_type(),
+                    )*
+                }
+            }
+            pub fn task_type(&self) -> crate::runtime::Task {
+                match self {
+                    $(
+                        ModelType::$x => model_type::$x::task_type(),
+                    )*
+                }
+            }
+        }   
+    }
+}
+input_type_impl![
+    Embedding,
+    SequenceClassification,
+    TokenClassification,
+    SentenceEmbedding,
+    ImageClassification
+];
+
 #[derive(Debug)]
-pub struct EncoderfileState<T: ModelTypeSpec> {
+pub struct EncoderfileState<T: ModelTypeSpec + InputType + TaskType> {
     pub config: Config,
     pub session: Mutex<Session>,
-    pub tokenizer: TokenizerService,
-    pub model_config: ModelConfig,
+    pub per_model_input_state: T::InputState,
+    pub per_task_state: T::TaskState,
     pub lua_libs: Vec<mlua::StdLib>,
     _marker: PhantomData<T>,
 }
 
-impl<T: ModelTypeSpec> EncoderfileState<T> {
+impl<T: ModelTypeSpec + InputType + TaskType> EncoderfileState<T> {
     pub fn new(
         config: Config,
         session: Mutex<Session>,
-        tokenizer: TokenizerService,
-        model_config: ModelConfig,
+        per_model_input_state: T::InputState,
+        per_task_state: T::TaskState,
     ) -> EncoderfileState<T> {
         let lua_libs = match config.lua_libs {
             Some(ref libs) => Vec::<mlua::StdLib>::from(libs),
@@ -35,8 +173,8 @@ impl<T: ModelTypeSpec> EncoderfileState<T> {
         EncoderfileState {
             config,
             session,
-            tokenizer,
-            model_config,
+            per_model_input_state,
+            per_task_state,
             lua_libs,
             _marker: PhantomData,
         }
diff --git a/encoderfile/src/services/embedding.rs b/encoderfile/src/services/embedding.rs
index 53e89f7b..5d55b372 100644
--- a/encoderfile/src/services/embedding.rs
+++ b/encoderfile/src/services/embedding.rs
@@ -8,14 +8,15 @@ use crate::{
 
 use super::inference::Inference;
 
-impl Inference for AppState<model_type::Embedding> {
+impl Inference for AppState<model_type::Embedding>
+{
     type Input = EmbeddingRequest;
     type Output = EmbeddingResponse;
 
     fn inference(&self, request: impl Into<Self::Input>) -> Result<Self::Output, ApiError> {
         let request = request.into();
 
-        let encodings = self.tokenizer.encode_text(request.inputs)?;
+        let encodings = self.per_model_input_state.tokenizer.encode_text(request.inputs)?;
 
         let transform = EmbeddingTransform::new(self.lua_libs.clone(), self.transform_str())?;
 
diff --git a/encoderfile/src/services/image_classification.rs b/encoderfile/src/services/image_classification.rs
new file mode 100644
index 00000000..89ff988e
--- /dev/null
+++ b/encoderfile/src/services/image_classification.rs
@@ -0,0 +1,133 @@
+use crate::{
+    common::{
+        ImageClassificationRequest,
+        ImageClassificationResponse,
+        ImageClassificationResult,
+        model_type
+    },
+
+    error::ApiError,
+    runtime::AppState,
+};
+use image::RgbImage;
+use ndarray::{Array4, s};
+
+use super::inference::Inference;
+use crate::inference::image_classification::image_classification;
+
+// No service impl yet
+
+const DEFAULT_FILTER_TYPE: image::imageops::FilterType = image::imageops::FilterType::Triangle;
+
+impl Inference for AppState<model_type::ImageClassification>
+{
+    type Input = ImageClassificationRequest;
+    type Output = ImageClassificationResponse;
+
+    fn inference(&self, request: impl Into<Self::Input>) -> Result<Self::Output, ApiError> {
+        let request = request.into();
+        let rescale_factor = 0.00392156862745098 as f32;
+        let image_mean = 0.5;
+        let image_std = 0.5;
+        // bilinear resampling
+
+        // convert input image into flattened rbg
+        let images: Vec<RgbImage> = (&request.images).into_iter().map(|image_info| {
+            let img = image::load_from_memory(&image_info.image_bytes).expect("Failed to load image from bytes");
+            println!("Height x width: {:?} x {:?}", img.height(), img.width());
+            img
+                .resize_exact(
+                    self.per_model_input_state.width.unwrap(),
+                    self.per_model_input_state.height.unwrap(),
+                    DEFAULT_FILTER_TYPE
+                )
+                .to_rgb8()
+        }).collect();
+        let batch_size = request.images.len();
+        let num_channels = self.per_model_input_state.num_channels as usize;
+        let height = self.per_model_input_state.height.unwrap() as usize;
+        let width = self.per_model_input_state.width.unwrap() as usize;
+
+        if num_channels != 3 {
+            return Err(ApiError::InputError("Image classification currently expects 3 RGB channels"));
+        }
+
+        let mut images_array = Array4::<f32>::zeros((batch_size, num_channels, height, width));
+        for (image_idx, img) in images.into_iter().enumerate() {
+            let raw = img.into_raw();
+
+            // The image crate stores RGB bytes in HWC order; rewrite into NCHW.
+            for y in 0..height {
+                for x in 0..width {
+                    let pixel_offset = (y * width + x) * num_channels;
+                    for c in 0..num_channels {
+                        images_array[[image_idx, c, y, x]] = raw[pixel_offset + c] as f32;
+                    }
+                }
+            }
+        }
+        println!("Some sample slice of the input array (pre scale, post reshape): {:?}", images_array.slice(s![.., .., 0..5, 0..5]));
+        // TODO make parallel
+        images_array.mapv_inplace(|x| ((x * rescale_factor) - image_mean) / image_std);
+        println!("Some sample slice of the input array (post scale): {:?}", images_array.slice(s![.., .., 0..5, 0..5]));
+
+        let label_map = self.per_task_state.id2label.clone().unwrap();
+        let mut entries: Vec<_> = label_map.iter().collect();
+        entries.sort_by(|x, y| x.0.cmp(&y.0));
+        let classes: Vec<String> = entries.into_iter().map(|(_, label)| label.clone()).collect();
+
+        let labels_batch = image_classification(
+            self.session.lock(),
+            images_array,
+            // COMMENT having optional fields complicates things later on, but otoh
+            // it allows models with variations of these fields
+            classes)?;
+
+        Ok(ImageClassificationResponse {
+            results: labels_batch.iter().map(|labels| ImageClassificationResult { labels: labels.clone() }).collect(),
+            metadata: request.metadata,
+        })
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use crate::common::model_type::ImageClassification;
+    use crate::dev_utils;
+    use crate::common::ImageClassificationRequest;
+    use crate::common::FromReadInput;
+    use std::fs::File;
+    use std::sync::Once;
+    use super::*;
+
+    fn init_tracing() {
+        static TRACING: Once = Once::new();
+
+        TRACING.call_once(|| {
+            let _ = tracing_subscriber::fmt()
+                .with_env_filter(
+                    tracing_subscriber::EnvFilter::try_from_default_env()
+                        .unwrap_or_else(|_| tracing_subscriber::EnvFilter::new("debug,ort=warn")),
+                )
+                .with_test_writer()
+                .try_init();
+        });
+    }
+
+    #[test]
+    fn test_image_classification_request_from_file() {
+        init_tracing();
+
+        let state = dev_utils::get_state::<ImageClassification>("../models/image_classification");
+        let mut file = File::open("../test-pictures/w3c_home.jpg").expect("Failed to open test image");
+        let file_vec = vec![&mut file];
+        let request = ImageClassificationRequest::from_read_input(file_vec).expect("Failed to create request from read input");
+        let response = state.inference(request).expect("Inference failed");
+        assert_eq!(response.results.len(), 1);
+        assert_eq!(response.results[0].labels.len(), 2);
+        assert_eq!(response.results[0].labels[0].label, "normal");
+        assert_eq!(response.results[0].labels[0].score, Some(1.5378942));
+        assert_eq!(response.results[0].labels[1].label, "nsfw");
+        assert_eq!(response.results[0].labels[1].score, Some(-1.6556994));
+    }
+}
\ No newline at end of file
diff --git a/encoderfile/src/services/inference.rs b/encoderfile/src/services/inference.rs
index 5e55b15b..60fb0095 100644
--- a/encoderfile/src/services/inference.rs
+++ b/encoderfile/src/services/inference.rs
@@ -1,8 +1,9 @@
 use crate::{common::FromCliInput, error::ApiError, services::Metadata};
 
+// FIXME enforce the openapi schema later on
 pub trait Inference: Metadata {
-    type Input: FromCliInput + serde::de::DeserializeOwned + Sync + Send + utoipa::ToSchema;
-    type Output: serde::Serialize + Sync + Send + utoipa::ToSchema;
+    type Input: FromCliInput + serde::de::DeserializeOwned + Sync + Send /* + utoipa::ToSchema */;
+    type Output: serde::Serialize + Sync + Send /* + utoipa::ToSchema */;
 
     fn inference(&self, request: impl Into<Self::Input>) -> Result<Self::Output, ApiError>;
 }
diff --git a/encoderfile/src/services/mod.rs b/encoderfile/src/services/mod.rs
index 43720d50..6d88d6db 100644
--- a/encoderfile/src/services/mod.rs
+++ b/encoderfile/src/services/mod.rs
@@ -4,6 +4,7 @@ mod model_metadata;
 mod sentence_embedding;
 mod sequence_classification;
 mod token_classification;
+mod image_classification;
 
 pub use inference::Inference;
 pub use model_metadata::Metadata;
diff --git a/encoderfile/src/services/model_metadata.rs b/encoderfile/src/services/model_metadata.rs
index d43cc28d..483ca753 100644
--- a/encoderfile/src/services/model_metadata.rs
+++ b/encoderfile/src/services/model_metadata.rs
@@ -1,16 +1,19 @@
 use std::collections::HashMap;
 
 use crate::{
-    common::{GetModelMetadataResponse, ModelType, model_type::ModelTypeSpec},
-    runtime::AppState,
+    common::{GetModelMetadataResponse, model_type::{ModelType, ModelTypeSpec}}, runtime::{AppState, TaskType, InputType},
 };
 
+pub trait ClassifierMetadata {
+    fn id2label(&self) -> Option<HashMap<u32, String>>;
+}
+
 pub trait Metadata {
     fn metadata(&self) -> GetModelMetadataResponse {
         GetModelMetadataResponse {
             model_id: self.model_id(),
             model_type: self.model_type(),
-            id2label: self.id2label(),
+            id2label: None,
         }
     }
 
@@ -18,10 +21,9 @@ pub trait Metadata {
 
     fn model_type(&self) -> ModelType;
 
-    fn id2label(&self) -> Option<HashMap<u32, String>>;
 }
 
-impl<T: ModelTypeSpec> Metadata for AppState<T> {
+impl<T: ModelTypeSpec + InputType + TaskType> Metadata for AppState<T> {
     fn model_id(&self) -> String {
         self.config.name.clone()
     }
@@ -30,7 +32,4 @@ impl<T: ModelTypeSpec> Metadata for AppState<T> {
         T::enum_val()
     }
 
-    fn id2label(&self) -> Option<HashMap<u32, String>> {
-        self.model_config.id2label.clone()
-    }
 }
diff --git a/encoderfile/src/services/sentence_embedding.rs b/encoderfile/src/services/sentence_embedding.rs
index 115c6322..08e812a8 100644
--- a/encoderfile/src/services/sentence_embedding.rs
+++ b/encoderfile/src/services/sentence_embedding.rs
@@ -8,14 +8,15 @@ use crate::{
 
 use super::inference::Inference;
 
-impl Inference for AppState<model_type::SentenceEmbedding> {
+impl Inference for AppState<model_type::SentenceEmbedding>
+{
     type Input = SentenceEmbeddingRequest;
     type Output = SentenceEmbeddingResponse;
 
     fn inference(&self, request: impl Into<Self::Input>) -> Result<Self::Output, ApiError> {
         let request = request.into();
 
-        let encodings = self.tokenizer.encode_text(request.inputs)?;
+        let encodings = self.per_model_input_state.tokenizer.encode_text(request.inputs)?;
 
         let transform =
             SentenceEmbeddingTransform::new(self.lua_libs.clone(), self.transform_str())?;
diff --git a/encoderfile/src/services/sequence_classification.rs b/encoderfile/src/services/sequence_classification.rs
index 52af7313..4911afbe 100644
--- a/encoderfile/src/services/sequence_classification.rs
+++ b/encoderfile/src/services/sequence_classification.rs
@@ -8,14 +8,15 @@ use crate::{
 
 use super::inference::Inference;
 
-impl Inference for AppState<model_type::SequenceClassification> {
+impl Inference for AppState<model_type::SequenceClassification>
+{
     type Input = SequenceClassificationRequest;
     type Output = SequenceClassificationResponse;
 
     fn inference(&self, request: impl Into<Self::Input>) -> Result<Self::Output, ApiError> {
         let request = request.into();
 
-        let encodings = self.tokenizer.encode_text(request.inputs)?;
+        let encodings = self.per_model_input_state.tokenizer.encode_text(request.inputs)?;
 
         let transform =
             SequenceClassificationTransform::new(self.lua_libs.clone(), self.transform_str())?;
@@ -23,7 +24,7 @@ impl Inference for AppState<model_type::SequenceClassification> {
         let results = inference::sequence_classification::sequence_classification(
             self.session.lock(),
             &transform,
-            &self.model_config,
+            &self.per_task_state,
             encodings,
         )?;
 
diff --git a/encoderfile/src/services/token_classification.rs b/encoderfile/src/services/token_classification.rs
index 2fd12329..0d4d5a62 100644
--- a/encoderfile/src/services/token_classification.rs
+++ b/encoderfile/src/services/token_classification.rs
@@ -8,7 +8,8 @@ use crate::{
 
 use super::inference::Inference;
 
-impl Inference for AppState<model_type::TokenClassification> {
+impl Inference for AppState<model_type::TokenClassification>
+{
     type Input = TokenClassificationRequest;
     type Output = TokenClassificationResponse;
 
@@ -17,7 +18,7 @@ impl Inference for AppState<model_type::TokenClassification> {
 
         let session = self.session.lock();
 
-        let encodings = self.tokenizer.encode_text(request.inputs)?;
+        let encodings = self.per_model_input_state.tokenizer.encode_text(request.inputs)?;
 
         let transform =
             TokenClassificationTransform::new(self.lua_libs.clone(), self.transform_str())?;
@@ -25,7 +26,7 @@ impl Inference for AppState<model_type::TokenClassification> {
         let results = inference::token_classification::token_classification(
             session,
             &transform,
-            &self.model_config,
+            &self.per_task_state,
             encodings,
         )?;
 
diff --git a/encoderfile/src/transforms/engine/image_classification.rs b/encoderfile/src/transforms/engine/image_classification.rs
new file mode 100644
index 00000000..6da82b8c
--- /dev/null
+++ b/encoderfile/src/transforms/engine/image_classification.rs
@@ -0,0 +1,140 @@
+use crate::{common::model_type, error::ApiError};
+
+use super::{super::tensor::Tensor, Postprocessor, Transform};
+use ndarray::{Array2, Ix2};
+
+impl Postprocessor for Transform<model_type::ImageClassification> {
+    type Input = Array2<f32>;
+    type Output = Array2<f32>;
+
+    fn postprocess(&self, data: Self::Input) -> Result<Self::Output, ApiError> {
+        let func = match self.postprocessor() {
+            Some(p) => p,
+            None => return Ok(data),
+        };
+
+        let expected_shape = data.shape().to_owned();
+
+        let tensor = Tensor(data.into_dyn());
+
+        let result = func
+            .call::<Tensor>(tensor)
+            .map_err(|e| ApiError::LuaError(e.to_string()))?
+            .into_inner()
+            .into_dimensionality::<Ix2>().map_err(|e| {
+                tracing::error!("Failed to cast array into Ix2: {e}. Check your lua transform to make sure it returns a tensor of shape [batch_size, num_classes]");
+                ApiError::LuaError("Error postprocessing image classifications".to_string())
+            })?;
+
+        let result_shape = result.shape();
+
+        if expected_shape.as_slice() != result_shape {
+            tracing::error!(
+                "Transform error: expected tensor of shape {:?}, got tensor of shape {:?}",
+                expected_shape.as_slice(),
+                result_shape
+            );
+
+            return Err(ApiError::LuaError(
+                "Error postprocessing image classifications".to_string(),
+            ));
+        }
+
+        Ok(result)
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::transforms::DEFAULT_LIBS;
+
+    #[test]
+    fn test_image_cls_no_transform() {
+        let engine = Transform::<model_type::ImageClassification>::new(
+            DEFAULT_LIBS.to_vec(),
+            Some("".to_string()),
+        )
+        .expect("Failed to create Transform");
+
+        let arr = ndarray::Array2::<f32>::from_elem((32, 16), 2.0);
+
+        let result = engine.postprocess(arr.clone()).expect("Failed");
+
+        assert_eq!(arr, result);
+    }
+
+    #[test]
+    fn test_image_cls_identity_transform() {
+        let engine = Transform::<model_type::ImageClassification>::new(
+            DEFAULT_LIBS.to_vec(),
+            Some(
+                r##"
+        function Postprocess(arr)
+            return arr
+        end
+        "##
+                .to_string(),
+            ),
+        )
+        .expect("Failed to create engine");
+
+        let arr = ndarray::Array2::<f32>::from_elem((16, 32), 2.0);
+
+        let result = engine.postprocess(arr.clone()).expect("Failed");
+
+        assert_eq!(arr, result);
+    }
+
+    #[test]
+    fn test_image_cls_transform_bad_fn() {
+        let engine = Transform::<model_type::ImageClassification>::new(
+            DEFAULT_LIBS.to_vec(),
+            Some(
+                r##"
+        function Postprocess(arr)
+            return 1
+        end
+        "##
+                .to_string(),
+            ),
+        )
+        .expect("Failed to create engine");
+
+        let arr = ndarray::Array2::<f32>::from_elem((16, 32), 2.0);
+
+        let result = engine.postprocess(arr.clone());
+
+        assert!(result.is_err())
+    }
+
+    #[test]
+    fn test_bad_dimensionality_transform_postprocessing() {
+        let engine = Transform::<model_type::ImageClassification>::new(
+            DEFAULT_LIBS.to_vec(),
+            Some(
+                r##"
+        function Postprocess(x)
+            return x:sum_axis(1)
+        end
+        "##
+                .to_string(),
+            ),
+        )
+        .unwrap();
+
+        let arr = ndarray::Array2::<f32>::from_elem((3, 3), 2.0);
+        let result = engine.postprocess(arr.clone());
+
+        assert!(result.is_err());
+
+        if let Err(e) = result {
+            match e {
+                ApiError::LuaError(s) => {
+                    assert!(s.contains("Error postprocessing image classifications"))
+                }
+                _ => panic!("Didn't return lua error"),
+            }
+        }
+    }
+}
diff --git a/encoderfile/src/transforms/engine/mod.rs b/encoderfile/src/transforms/engine/mod.rs
index 73cee6e2..3a4510ee 100644
--- a/encoderfile/src/transforms/engine/mod.rs
+++ b/encoderfile/src/transforms/engine/mod.rs
@@ -16,6 +16,7 @@ mod embedding;
 mod sentence_embedding;
 mod sequence_classification;
 mod token_classification;
+mod image_classification;
 
 impl From<&LuaLibs> for Vec<mlua::StdLib> {
     fn from(value: &LuaLibs) -> Self {
@@ -86,6 +87,7 @@ transform!(EmbeddingTransform, Embedding);
 transform!(SequenceClassificationTransform, SequenceClassification);
 transform!(TokenClassificationTransform, TokenClassification);
 transform!(SentenceEmbeddingTransform, SentenceEmbedding);
+transform!(ImageClassificationTransform, ImageClassification);
 
 pub trait Postprocessor: TransformSpec {
     type Input;
diff --git a/encoderfile/src/transport/cli.rs b/encoderfile/src/transport/cli.rs
index 48c73b60..e054db72 100644
--- a/encoderfile/src/transport/cli.rs
+++ b/encoderfile/src/transport/cli.rs
@@ -46,13 +46,13 @@ pub trait CliRoute: Inference {
 impl<T: Inference> CliRoute for T {}
 
 #[derive(Parser)]
-pub struct Cli {
+pub struct TextCli {
     #[command(subcommand)]
-    pub command: Commands,
+    pub command: TextCommands,
 }
 
 #[derive(Subcommand)]
-pub enum Commands {
+pub enum TextCommands {
     Serve {
         #[arg(long, default_value = "[::]")]
         grpc_hostname: String,
@@ -95,13 +95,13 @@ pub enum Commands {
     },
 }
 
-impl Commands {
+impl TextCommands {
     pub async fn execute<S>(self, state: S) -> Result<()>
     where
         S: Inference + GrpcRouter + HttpRouter + McpRouter + CliRoute,
     {
         match self {
-            Commands::Serve {
+            TextCommands::Serve {
                 grpc_hostname,
                 grpc_port,
                 http_hostname,
@@ -152,7 +152,7 @@ impl Commands {
 
                 let _ = tokio::join!(grpc_process, http_process);
             }
-            Commands::Infer {
+            TextCommands::Infer {
                 inputs,
                 format,
                 out_dir,
@@ -161,7 +161,7 @@ impl Commands {
 
                 state.cli_route(inputs, format, out_dir)?
             }
-            Commands::Mcp {
+            TextCommands::Mcp {
                 hostname,
                 port,
                 cert_file,
@@ -177,6 +177,117 @@ impl Commands {
     }
 }
 
+#[derive(Parser)]
+pub struct ImageCli {
+    #[command(subcommand)]
+    pub command: ImageCommands,
+}
+
+#[derive(Subcommand)]
+pub enum ImageCommands {
+    Serve {
+        #[arg(long, default_value = "[::]")]
+        grpc_hostname: String,
+        #[arg(long, default_value = "50051")]
+        grpc_port: String,
+        #[arg(long, default_value = "0.0.0.0")]
+        http_hostname: String,
+        #[arg(long, default_value = "8080")]
+        http_port: String,
+        #[arg(long, default_value_t = false)]
+        disable_grpc: bool,
+        #[arg(long, default_value_t = false)]
+        disable_http: bool,
+        #[arg(long, default_value_t = false)]
+        enable_otel: bool,
+        #[arg(long, default_value = "http://localhost:4317")]
+        otel_exporter_url: String,
+        #[arg(long)]
+        cert_file: Option<String>,
+        #[arg(long)]
+        key_file: Option<String>,
+    },
+    Infer {
+        #[arg(required = true)]
+        inputs: Vec<String>,
+        #[arg(short, long, default_value_t = Format::Json)]
+        format: Format,
+        #[arg(short)]
+        out_dir: Option<String>,
+    },
+}
+
+impl ImageCommands {
+    pub async fn execute<S>(self, state: S) -> Result<()>
+    where
+        S: Inference + GrpcRouter + HttpRouter + CliRoute,
+    {
+        match self {
+            ImageCommands::Serve {
+                grpc_hostname,
+                grpc_port,
+                http_hostname,
+                http_port,
+                disable_grpc,
+                disable_http,
+                enable_otel,
+                otel_exporter_url,
+                cert_file,
+                key_file,
+            } => {
+                let banner = crate::get_banner(state.model_id().as_str());
+
+                if disable_grpc && disable_http {
+                    return Err(crate::error::ApiError::ConfigError(
+                        "Cannot disable both gRPC and HTTP",
+                    ))?;
+                }
+
+                match enable_otel {
+                    true => setup_tracing(Some(otel_exporter_url.as_str())),
+                    false => setup_tracing(None),
+                }?;
+
+                let grpc_process = match disable_grpc {
+                    true => tokio::spawn(async { Ok(()) }),
+                    false => tokio::spawn(run_grpc(
+                        grpc_hostname,
+                        grpc_port,
+                        cert_file.clone(),
+                        key_file.clone(),
+                        state.clone(),
+                    )),
+                };
+
+                let http_process = match disable_http {
+                    true => tokio::spawn(async { Ok(()) }),
+                    false => tokio::spawn(run_http(
+                        http_hostname,
+                        http_port,
+                        cert_file.clone(),
+                        key_file.clone(),
+                        state.clone(),
+                    )),
+                };
+
+                println!("{}", banner);
+
+                let _ = tokio::join!(grpc_process, http_process);
+            }
+            ImageCommands::Infer {
+                inputs,
+                format,
+                out_dir,
+            } => {
+                setup_tracing(None)?;
+
+                state.cli_route(inputs, format, out_dir)?
+            }
+        }
+        Ok(())
+    }
+}
+
 #[derive(Clone, ValueEnum)]
 pub enum Format {
     Json,
diff --git a/encoderfile/src/transport/grpc/mod.rs b/encoderfile/src/transport/grpc/mod.rs
index 162de39a..871b5c3f 100644
--- a/encoderfile/src/transport/grpc/mod.rs
+++ b/encoderfile/src/transport/grpc/mod.rs
@@ -1,6 +1,6 @@
 use crate::{
     common::model_type,
-    generated::{embedding, sentence_embedding, sequence_classification, token_classification},
+    generated::{embedding, sentence_embedding, sequence_classification, token_classification, image_classification},
     runtime::AppState,
     services::{Inference, Metadata},
 };
@@ -116,3 +116,13 @@ generate_grpc_server!(
     SentenceEmbeddingInference,
     SentenceEmbeddingInferenceServer
 );
+
+generate_grpc_server!(
+    ImageClassification,
+    image_classification,
+    image_classification_inference_server,
+    ImageClassificationRequest,
+    ImageClassificationResponse,
+    ImageClassificationInference,
+    ImageClassificationInferenceServer
+);
diff --git a/encoderfile/src/transport/http/example.md b/encoderfile/src/transport/http/example.md
new file mode 100644
index 00000000..3eb1bfc9
--- /dev/null
+++ b/encoderfile/src/transport/http/example.md
@@ -0,0 +1,316 @@
+# Multipart OpenAPI Service Example
+
+This document provides examples of how to interact with the multipart file upload and prediction endpoint.
+
+## Endpoint Overview
+
+- **POST /predict/multipart** - Submit a JSON payload with binary file attachments
+- **GET /predict/multipart/openapi.json** - Retrieve the OpenAPI specification
+
+## Example 1: cURL with Two Image Files
+
+```bash
+curl -X POST http://localhost:8080/predict/multipart \
+  -F "payload={\"model_version\": \"1.0\", \"threshold\": 0.8}" \
+  -F "files=@/path/to/image1.png" \
+  -F "files=@/path/to/image2.jpg"
+```
+
+### Request Body (multipart/form-data)
+
+```
+--boundary_123abc456def
+Content-Disposition: form-data; name="payload"
+Content-Type: application/json
+
+{"model_version": "1.0", "threshold": 0.8}
+--boundary_123abc456def
+Content-Disposition: form-data; name="files"; filename="image1.png"
+Content-Type: image/png
+
+<binary PNG data here>
+--boundary_123abc456def
+Content-Disposition: form-data; name="files"; filename="image2.jpg"
+Content-Type: image/jpeg
+
+<binary JPG data here>
+--boundary_123abc456def--
+```
+
+### Response
+
+```json
+{
+  "payload": {
+    "model_version": "1.0",
+    "threshold": 0.8
+  },
+  "attachment_count": 2,
+  "attachments": [
+    {
+      "file_name": "image1.png",
+      "content_type": "image/png",
+      "size_bytes": 45230
+    },
+    {
+      "file_name": "image2.jpg",
+      "content_type": "image/jpeg",
+      "size_bytes": 52104
+    }
+  ]
+}
+```
+
+## Example 2: Python Requests Library
+
+```python
+import requests
+import json
+
+url = "http://localhost:8080/predict/multipart"
+
+# Prepare the payload
+payloaquest Body (multipart/form-data)
+
+```
+--boundary_xyz789pqr012
+Content-Disposition: form-data; name="payload"; filename="payload.json"
+Content-Type: application/json
+
+{"model_version": "1.0", "threshold": 0.8, "batch_id": "batch_12345"}
+--boundary_xyz789pqr012
+Content-Disposition: form-data; name="files"; filename="image1.png"
+Content-Type: image/png
+
+<binary PNG data>
+--boundary_xyz789pqr012
+Content-Disposition: form-data; name="files"; filename="image2.jpg"
+Content-Type: image/jpeg
+
+<binary JPG data>
+--boundary_xyz789pqr012
+Content-Disposition: form-data; name="files"; filename="document.pdf"
+Content-Type: application/pdf
+
+<binary PDF data>
+--boundary_xyz789pqr012--
+```
+
+### Red = {
+    "model_version": "1.0",
+    "threshold": 0.8,
+    "batch_id": "batch_12345"
+}
+
+# Prepare files
+files = [
+    ("payload", ("payload.json", json.dumps(payload), "application/json")),
+    ("files", ("image1.png", open("image1.png", "rb"), "image/png")),
+    ("files", ("image2.jpg", open("image2.jpg", "rb"), "image/jpeg")),
+    ("files", ("document.pdf", open("document.pdf", "rb"), "application/pdf")),
+]
+
+# Send the request
+response = requests.post(url, files=files)
+
+print("Status Code:", response.status_code)
+print("Response:", response.json())
+```
+
+### Response
+
+```json
+{
+  "payload": {
+    "model_version": "1.0",
+    "threshold": 0.8,
+    "batch_id": "batch_12345"
+  },
+  "attachment_count": 3,
+  "attachments": [
+    {
+      "file_name": "image1.png",
+      "content_type": "image/png",
+      quest Body (multipart/form-data)
+
+```
+--boundary_webkit_abc123
+Content-Disposition: form-data; name="payload"
+
+{"model_version":"1.0","threshold":0.8,"inference_id":"inf_abc123"}
+--boundary_webkit_abc123
+Content-Disposition: form-data; name="files"; filename="photo1.jpg"
+Content-Type: image/jpeg
+
+<binary JPG data>
+--boundary_webkit_abc123
+Content-Disposition: form-data; name="files"; filename="photo2.jpg"
+Content-Type: image/jpeg
+
+<binary JPG data>
+--boundary_webkit_abc123--
+```
+
+### Re"size_bytes": 45230
+    },
+    {
+      "file_name": "image2.jpg",
+      "content_type": "image/jpeg",
+      "size_bytes": 52104
+    },
+    {
+      "file_name": "document.pdf",
+      "content_type": "application/pdf",
+      "size_bytes": 128512
+    }
+  ]
+}
+```
+
+## Example 3: JavaScript Fetch API
+
+```javascript
+const payload = {
+  model_version: "1.0",
+  threshold: 0.8,
+  inference_id: "inf_abc123"
+};
+
+const formData = new FormData();
+
+// Add the JSON payload as a form field
+formData.append("payload", JSON.stringify(payload));
+
+// Add multiple binary files
+const imageFile1 = document.getElementById("imageInput1").files[0];
+const imageFile2 = document.getElementById("imageInput2").files[0];
+
+formData.append("files", imageFile1);
+formData.append("files", imageFile2);
+
+// Make the request
+const response = await fetch("http://localhost:8080/predict/multipart", {
+  method: "POST",
+  body: formData
+});
+
+const result = await response.json();
+console.log("Success:", result);
+```
+
+### Response
+
+```json
+{
+  "payload": {
+    "model_version": "1.0",
+    "threshold": 0.8,
+    "inference_id": "inf_abc123"
+  },
+  "attachment_count": 2,
+  "attachments": [
+    {
+      "file_name": "photo1.jpg",
+      "content_type": "image/jpeg",
+      "size_bytes": 245120
+    },
+    {
+      "file_name": "photo2.jpg",
+      "content_type": "image/jpeg",
+      "size_bytes": 187904
+    }
+  ]
+}
+```
+
+## Example 4: Error Handling
+
+### Missing Payload
+
+If the request is sent without a `payload` form field:
+
+```bash
+curl -X POST http://localhost:8080/predict/multipart \
+  -F "files=@/path/to/image.png"
+```
+
+**Response (422 Unprocessable Entity):**
+
+```
+missing required multipart field 'payload'
+```
+
+### Invalid JSON in Payload
+
+If the payload field contains invalid JSON:
+
+```bash
+curl -X POST http://localhost:8080/predict/multipart \
+  -F "payload=not valid json" \
+  -F "files=@/path/to/image.png"
+```
+
+**Response (422 Unprocessable Entity):**
+
+```
+invalid json in 'payload' field
+```
+
+### Malformed Multipart Body
+
+If the multipart encoding is corrupted:
+
+**Response (400 Bad Request):**
+
+```
+multipart parse error: [error details]
+```
+
+## Request Parts Specification
+
+### Required: `payload` Part
+
+- **Name**: `payload` (exactly one)
+- **Content-Type**: `application/json` (recommended)
+- **Content**: Valid JSON object or array
+
+### Optional: `files` Parts
+
+- **Name**: `files` (zero or more)
+- **Content-Type**: Any MIME type (e.g., `image/png`, `application/pdf`)
+- **Content**: Binary data
+- **Filename**: Optional but recommended (used in response metadata)
+
+## Response Structure
+
+```json
+{
+  "payload": "...",                 // Echo of the submitted JSON payload
+  "attachment_count": 3,            // Number of files attached
+  "attachments": [                  // Metadata for each file
+    {
+      "file_name": "...",           // Original filename if provided, null otherwise
+      "content_type": "...",        // MIME type if provided, null otherwise
+      "size_bytes": 12345           // File size in bytes
+    }
+  ]
+}
+```
+
+## HTTP Status Codes
+
+| Status | Meaning | Condition |
+|--------|---------|-----------|
+| 200 | OK | Request processed successfully |
+| 400 | Bad Request | Malformed multipart body |
+| 422 | Unprocessable Entity | Missing `payload` or invalid JSON |
+
+## OpenAPI Specification
+
+To retrieve the OpenAPI specification for this endpoint:
+
+```bash
+curl -X GET http://localhost:8080/predict/multipart/openapi.json
+```
+
+This returns a machine-readable OpenAPI 3.0 document describing the endpoint.
diff --git a/encoderfile/src/transport/http/mod.rs b/encoderfile/src/transport/http/mod.rs
index f5b5ffd1..cc526318 100644
--- a/encoderfile/src/transport/http/mod.rs
+++ b/encoderfile/src/transport/http/mod.rs
@@ -1,5 +1,6 @@
 mod base;
 mod error;
+pub mod multipart_openapi;
 
 pub trait HttpRouter
 where
diff --git a/encoderfile/src/transport/http/multipart_openapi.rs b/encoderfile/src/transport/http/multipart_openapi.rs
new file mode 100644
index 00000000..6b5d11b8
--- /dev/null
+++ b/encoderfile/src/transport/http/multipart_openapi.rs
@@ -0,0 +1,282 @@
+use axum::{
+    Json,
+    extract::{Multipart, State},
+    http::StatusCode,
+    response::{IntoResponse, Response},
+};
+use serde::{Deserialize, Serialize};
+use utoipa::OpenApi;
+use crate::common::model_type::ImageClassification;
+use crate::runtime::AppState;
+
+pub const MULTIPART_PREDICT_ENDPOINT: &str = "/predict/multipart";
+pub const MULTIPART_OPENAPI_ENDPOINT: &str = "/predict/multipart/openapi.json";
+
+#[derive(Debug, Serialize, Deserialize, utoipa::ToSchema)]
+pub struct MultipartPredictBody {
+    /// Arbitrary JSON payload sent in the multipart part named `payload`.
+    pub payload: serde_json::Value,
+
+    /// Binary attachments sent as repeated `files` multipart parts.
+    #[schema(value_type = Vec<String>)]
+    pub files: Vec<String>,
+}
+
+#[derive(Debug, Serialize, Deserialize, utoipa::ToSchema)]
+pub struct ParsedAttachment {
+    pub file_name: Option<String>,
+    pub content_type: Option<String>,
+    pub size_bytes: usize,
+}
+
+#[derive(Debug, Serialize, Deserialize, utoipa::ToSchema, utoipa::ToResponse)]
+pub struct MultipartPredictResponse {
+    pub payload: serde_json::Value,
+    pub attachment_count: usize,
+    pub attachments: Vec<ParsedAttachment>,
+}
+
+#[derive(Debug, thiserror::Error)]
+pub enum MultipartApiError {
+    #[error("missing required multipart field 'payload'")]
+    MissingPayload,
+    #[error("invalid json in 'payload' field")]
+    InvalidPayload,
+    #[error("multipart parse error: {0}")]
+    Multipart(String),
+    #[error("failed to construct request from multipart: {0}")]
+    RequestConstruction(String),
+}
+
+impl IntoResponse for MultipartApiError {
+    fn into_response(self) -> Response {
+        let status = match self {
+            Self::MissingPayload | Self::InvalidPayload => StatusCode::UNPROCESSABLE_ENTITY,
+            Self::RequestConstruction(_) => StatusCode::UNPROCESSABLE_ENTITY,
+            Self::Multipart(_) => StatusCode::BAD_REQUEST,
+        };
+
+        (status, self.to_string()).into_response()
+    }
+}
+
+/// Trait for converting multipart payload and attachments into a typed request.
+pub trait FromMultipart: Sized {
+    /// Construct an instance from a JSON payload and list of attachment bytes.
+    fn from_multipart(
+        payload: serde_json::Value,
+        attachments: Vec<(Option<String>, Option<String>, bytes::Bytes)>,
+    ) -> Result<Self, MultipartApiError>;
+}
+
+#[derive(Debug, utoipa::OpenApi)]
+#[openapi(paths(post_multipart), components(schemas(MultipartPredictBody, MultipartPredictResponse, ParsedAttachment)))]
+pub struct MultipartApiDoc;
+
+#[utoipa::path(
+    get,
+    path = MULTIPART_OPENAPI_ENDPOINT,
+    responses(
+        (status = 200, description = "Successful")
+    )
+)]
+pub async fn openapi() -> impl IntoResponse {
+    Json(MultipartApiDoc::openapi())
+}
+
+#[utoipa::path(
+    post,
+    path = MULTIPART_PREDICT_ENDPOINT,
+    request_body(
+        content = MultipartPredictBody,
+        content_type = "multipart/form-data",
+        description = "Multipart payload with a JSON part named 'payload' and 0..N binary parts named 'files'"
+    ),
+    responses(
+        (status = 200, body = MultipartPredictResponse),
+        (status = 422, description = "Missing or invalid payload JSON"),
+        (status = 400, description = "Invalid multipart body")
+    )
+)]
+pub async fn post_multipart(
+    mut multipart: Multipart,
+) -> Result<Json<MultipartPredictResponse>, MultipartApiError> {
+    parse_multipart(&mut multipart).await
+}
+
+/// Generic multipart parser that extracts payload and attachments.
+pub async fn parse_multipart(
+    multipart: &mut Multipart,
+) -> Result<Json<MultipartPredictResponse>, MultipartApiError> {
+    let mut payload: Option<serde_json::Value> = None;
+    let mut attachments = Vec::new();
+    let mut attachment_metadata = Vec::new();
+
+    while let Some(field) = multipart
+        .next_field()
+        .await
+        .map_err(|e| MultipartApiError::Multipart(e.to_string()))?
+    {
+        let name = field.name().map(ToOwned::to_owned);
+        let file_name = field.file_name().map(ToOwned::to_owned);
+        let content_type = field.content_type().map(ToOwned::to_owned);
+        let bytes = field
+            .bytes()
+            .await
+            .map_err(|e| MultipartApiError::Multipart(e.to_string()))?;
+
+        match name.as_deref() {
+            Some("payload") => {
+                payload = Some(
+                    serde_json::from_slice(&bytes).map_err(|_| MultipartApiError::InvalidPayload)?,
+                );
+            }
+            Some("files") => {
+                attachment_metadata.push(ParsedAttachment {
+                    file_name: file_name.clone(),
+                    content_type: content_type.clone(),
+                    size_bytes: bytes.len(),
+                });
+                attachments.push((file_name, content_type, bytes));
+            }
+            _ => {}
+        }
+    }
+
+    let payload = payload.ok_or(MultipartApiError::MissingPayload)?;
+
+    Ok(Json(MultipartPredictResponse {
+        payload,
+        attachment_count: attachment_metadata.len(),
+        attachments: attachment_metadata,
+    }))
+}
+
+/// Generic handler that converts multipart request into typed request.
+pub async fn post_multipart_typed<R: FromMultipart>(
+    mut multipart: Multipart,
+) -> Result<Json<MultipartPredictResponse>, MultipartApiError> {
+    let mut payload: Option<serde_json::Value> = None;
+    let mut attachments = Vec::new();
+    let mut attachment_metadata = Vec::new();
+
+    while let Some(field) = multipart
+        .next_field()
+        .await
+        .map_err(|e| MultipartApiError::Multipart(e.to_string()))?
+    {
+        let name = field.name().map(ToOwned::to_owned);
+        let file_name = field.file_name().map(ToOwned::to_owned);
+        let content_type = field.content_type().map(ToOwned::to_owned);
+        let bytes = field
+            .bytes()
+            .await
+            .map_err(|e| MultipartApiError::Multipart(e.to_string()))?;
+
+        match name.as_deref() {
+            Some("payload") => {
+                payload = Some(
+                    serde_json::from_slice(&bytes).map_err(|_| MultipartApiError::InvalidPayload)?,
+                );
+            }
+            Some("files") => {
+                attachment_metadata.push(ParsedAttachment {
+                    file_name: file_name.clone(),
+                    content_type: content_type.clone(),
+                    size_bytes: bytes.len(),
+                });
+                attachments.push((file_name, content_type, bytes));
+            }
+            _ => {}
+        }
+    }
+
+    let payload = payload.ok_or(MultipartApiError::MissingPayload)?;
+
+    // Convert to typed request
+    let _request: R = R::from_multipart(payload.clone(), attachments)?;
+
+    Ok(Json(MultipartPredictResponse {
+        payload,
+        attachment_count: attachment_metadata.len(),
+        attachments: attachment_metadata,
+    }))
+}
+
+pub fn router() -> axum::Router {
+    axum::Router::new()
+        .route(MULTIPART_PREDICT_ENDPOINT, axum::routing::post(post_multipart))
+        .route(MULTIPART_OPENAPI_ENDPOINT, axum::routing::get(openapi))
+}
+
+/// HttpRouter implementation for ImageClassification model type.
+/// Combines standard model serving endpoints with multipart file upload capability.
+impl super::HttpRouter for crate::runtime::AppState<ImageClassification> {
+    fn http_router(self) -> axum::Router {
+        axum::Router::new()
+            .route("/health", axum::routing::get(super::base::health))
+            .route(
+                "/model",
+                axum::routing::get(super::base::get_model_metadata::<Self>),
+            )
+            .route("/predict", axum::routing::post(predict_handler))
+            .route("/openapi.json", axum::routing::get(standard_openapi))
+            .route(
+                MULTIPART_PREDICT_ENDPOINT,
+                axum::routing::post(post_multipart_image_classification),
+            )
+            .route(MULTIPART_OPENAPI_ENDPOINT, axum::routing::get(openapi))
+            .with_state(self)
+    }
+}
+
+/// Multipart handler specialized for ImageClassificationRequest.
+async fn post_multipart_image_classification(
+    multipart: Multipart,
+) -> Result<Json<MultipartPredictResponse>, MultipartApiError> {
+    post_multipart_typed::<crate::common::ImageClassificationRequest>(multipart).await
+}
+
+/// Standard predict endpoint for ImageClassification.
+async fn predict_handler(
+    State(state): State<AppState<ImageClassification>>,
+    Json(req): Json<
+        <AppState<ImageClassification> as crate::services::Inference>::Input,
+    >,
+) -> impl IntoResponse {
+    super::base::predict(State(state), Json(req)).await
+}
+
+/// Standard OpenAPI endpoint for ImageClassification model service (without multipart).
+async fn standard_openapi() -> impl IntoResponse {
+    Json(serde_json::json!({
+        "openapi": "3.0.0",
+        "info": {
+            "title": "ImageClassification Model API",
+            "version": "1.0.0"
+        },
+        "paths": {
+            "/health": {
+                "get": {
+                    "responses": {
+                        "200": { "description": "Successful" }
+                    }
+                }
+            },
+            "/model": {
+                "get": {
+                    "responses": {
+                        "200": { "description": "Successful" }
+                    }
+                }
+            },
+            "/predict": {
+                "post": {
+                    "responses": {
+                        "200": { "description": "Successful" }
+                    }
+                }
+            }
+        }
+    }))
+}
diff --git a/encoderfile/src/transport/mcp/mod.rs b/encoderfile/src/transport/mcp/mod.rs
index 4512c711..e61bccbb 100644
--- a/encoderfile/src/transport/mcp/mod.rs
+++ b/encoderfile/src/transport/mcp/mod.rs
@@ -151,3 +151,16 @@ generate_mcp!(
     "Performs sentence embedding of input text sequences.",
     "This tool will embed a sequence of texts."
 );
+
+// Doesn't use a json schema, see how we can go around this limitation
+/*
+generate_mcp!(
+    ImageClassification,
+    ImageClassificationTool,
+    image_classification,
+    ImageClassificationRequest,
+    ImageClassificationResponse,
+    "Performs image classification of input images.",
+    "This tool will classify input images."
+);
+*/
\ No newline at end of file
diff --git a/encoderfile/tests/test_mcp.rs b/encoderfile/tests/test_mcp.rs
index 55ac6ab0..8608f5b2 100644
--- a/encoderfile/tests/test_mcp.rs
+++ b/encoderfile/tests/test_mcp.rs
@@ -5,8 +5,9 @@ use encoderfile::transport::mcp::McpRouter;
 use tokio::net::TcpListener;
 use tokio::sync::oneshot;
 use tower_http::trace::DefaultOnResponse;
+use encoderfile::runtime::{InputType, TaskType};
 
-async fn run_mcp<T: ModelTypeSpec>(
+async fn run_mcp<T: ModelTypeSpec + InputType + TaskType>(
     addr: String,
     state: AppState<T>,
     shutdown_receiver: oneshot::Receiver<()>,
diff --git a/encoderfile/tests/test_model_validation.rs b/encoderfile/tests/test_model_validation.rs
index 25d971b4..11d819c6 100644
--- a/encoderfile/tests/test_model_validation.rs
+++ b/encoderfile/tests/test_model_validation.rs
@@ -1,6 +1,6 @@
 use std::path::PathBuf;
 
-use encoderfile::{builder::model::ModelTypeExt as _, common::ModelType};
+use encoderfile::{builder::model::ModelTypeExt as _, common::model_type::ModelType};
 
 #[test]
 pub fn test_embedding() {
@@ -45,3 +45,16 @@ pub fn test_sequence_classification() {
             .is_ok()
     );
 }
+
+#[test]
+pub fn test_image_classification() {
+    let path = PathBuf::from("../models/image_classification/model.onnx");
+
+    assert!(ModelType::ImageClassification.validate_model(&path).is_ok());
+    assert!(
+        ModelType::TokenClassification
+            .validate_model(&path)
+            .is_err()
+    );
+}
+
diff --git a/encoderfile/tests/test_models.rs b/encoderfile/tests/test_models.rs
index 44718dc0..c95840cc 100644
--- a/encoderfile/tests/test_models.rs
+++ b/encoderfile/tests/test_models.rs
@@ -4,12 +4,14 @@ use encoderfile::inference::{
     token_classification::token_classification,
 };
 use encoderfile::transforms::{DEFAULT_LIBS, Transform};
+use encoderfile::runtime::{InputType, TaskType};
 
 #[test]
 fn test_embedding_model() {
     let state = embedding_state();
 
     let encodings = state
+        .per_model_input_state
         .tokenizer
         .encode_text(vec![
             "hello world".to_string(),
@@ -34,6 +36,7 @@ fn test_embedding_inference_with_bad_model() {
     let state = token_classification_state();
 
     let encodings = state
+        .per_model_input_state
         .tokenizer
         .encode_text(vec![
             "hello world".to_string(),
@@ -54,6 +57,7 @@ fn test_sequence_classification_model() {
     let state = sequence_classification_state();
 
     let encodings = state
+        .per_model_input_state
         .tokenizer
         .encode_text(vec![
             "hello world".to_string(),
@@ -69,7 +73,7 @@ fn test_sequence_classification_model() {
     let results = sequence_classification(
         session_lock,
         &transform,
-        &state.model_config,
+        &state.per_task_state,
         encodings.clone(),
     )
     .expect("Failed to compute results");
@@ -77,12 +81,15 @@ fn test_sequence_classification_model() {
     assert!(results.len() == encodings.len());
 }
 
+// FIXME doesn't compile
+/*
 #[test]
 #[should_panic]
 fn test_sequence_classification_inference_with_bad_model() {
     let state = embedding_state();
 
     let encodings = state
+        .per_model_input_state
         .tokenizer
         .encode_text(vec![
             "hello world".to_string(),
@@ -98,17 +105,19 @@ fn test_sequence_classification_inference_with_bad_model() {
     sequence_classification(
         session_lock,
         &transform,
-        &state.model_config,
+        &state.per_task_state,
         encodings.clone(),
     )
     .expect("Failed to compute results");
 }
+*/
 
 #[test]
 fn test_token_classification_model() {
     let state = token_classification_state();
 
     let encodings = state
+        .per_model_input_state
         .tokenizer
         .encode_text(vec![
             "hello world".to_string(),
@@ -124,7 +133,7 @@ fn test_token_classification_model() {
     let results = token_classification(
         session_lock,
         &transform,
-        &state.model_config,
+        &state.per_task_state,
         encodings.clone(),
     )
     .expect("Failed to compute results");
@@ -138,6 +147,7 @@ fn test_token_classification_inference_with_bad_model() {
     let state = sequence_classification_state();
 
     let encodings = state
+        .per_model_input_state
         .tokenizer
         .encode_text(vec![
             "hello world".to_string(),
@@ -153,8 +163,36 @@ fn test_token_classification_inference_with_bad_model() {
     token_classification(
         session_lock,
         &transform,
-        &state.model_config,
+        &state.per_task_state,
         encodings.clone(),
     )
     .expect("Failed to compute results");
 }
+
+#[test]
+fn test_image_classification_model() {
+    // TODO
+    /*
+    let state = embedding_state();
+
+    let encodings = state
+        .per_model_input_state
+        .tokenizer
+        .encode_text(vec![
+            "hello world".to_string(),
+            "the quick brown fox jumps over the lazy dog".to_string(),
+        ])
+        .expect("Failed to encode text");
+
+    let session_lock = state.session.lock();
+
+    let transform =
+        Transform::new(DEFAULT_LIBS.to_vec(), None).expect("Failed to create_transform");
+
+    let results =
+        embedding(session_lock, &transform, encodings.clone()).expect("Failed to compute results");
+
+    assert!(results.len() == encodings.len());
+    */
+}
+
diff --git a/test_img_class_config.yml b/test_img_class_config.yml
new file mode 100644
index 00000000..723a0bda
--- /dev/null
+++ b/test_img_class_config.yml
@@ -0,0 +1,6 @@
+encoderfile:
+  name: test-img-class
+  path: models/image_classification
+  model_type: image_classification
+  output_path: ./test-img-class.encoderfile
+