---
# Model loading settings, grouped under a single `model_config` mapping.
# NOTE(review): the key names match keyword arguments of Hugging Face
# Transformers' `from_pretrained`; presumably they are forwarded there --
# confirm against the code that reads this file.
model_config:
  # Model identifier in "<organization>/<model>" form.
  model_name: "microsoft/Phi-3-mini-4k-instruct"
  # Kept as a quoted string; the consumer is expected to map it to a dtype.
  torch_dtype: "float32"
  trust_remote_code: true
  use_cache: true
  attn_implementation: "eager"
  device_map: "cpu"
  # `load_in_8bit` is intentionally not set in this configuration; do not
  # re-add it. NOTE(review): presumably because 8-bit loading does not apply
  # to this CPU / float32 setup -- confirm.