{
  "processor": {
    "name": "phi_4_vision_processor",
    "transforms": [
      {
        "operation": {
          "name": "decode_image",
          "type": "DecodeImage",
          "attrs": {
            "color_space": "RGB"
          }
        }
      },
      {
        "operation": {
          "name": "phi4_vision_dynamic_preprocess",
          "type": "Phi4VisionDynamicPreprocess",
          "attrs": {
            "dynamic_hd": 36,
            "dyhd_base_resolution": 448
          }
        }
      },
      {
        "operation": {
          "name": "rescale",
          "type": "Rescale",
          "inputs": [
            ":0"
          ]
        }
      },
      {
        "operation": {
          "name": "normalize",
          "type": "Normalize",
          "attrs": {
            "mean": [
              0.5,
              0.5,
              0.5
            ],
            "std": [
              0.5,
              0.5,
              0.5
            ]
          }
        }
      },
      {
        "operation": {
          "name": "phi4_vision_processor",
          "type": "Phi4VisionProcessor",
          "inputs": [
            ":0",
            "phi4_vision_dynamic_preprocess:1"
          ],
          "attrs": {
            "dyhd_base_resolution": 448,
            "interpolation": "CUBIC"
          }
        }
      }
    ],
    "output_aligner": "phi4-vision-aligner"
  }
}