diff --git a/charms/kserve-controller/tests/integration/hugginface-bert.yaml b/charms/kserve-controller/tests/integration/hugginface-bert.yaml
new file mode 100644
index 0000000..6d662fc
--- /dev/null
+++ b/charms/kserve-controller/tests/integration/hugginface-bert.yaml
@@ -0,0 +1,19 @@
+apiVersion: serving.kserve.io/v1beta1
+kind: InferenceService
+metadata:
+  name: huggingface-bert
+spec:
+  predictor:
+    model:
+      modelFormat:
+        name: huggingface
+      args:
+        - --model_name=bert
+        - --model_id=google-bert/bert-base-uncased
+      resources:
+        limits:
+          cpu: 1
+          memory: 500Mi
+        requests:
+          cpu: 100m
+          memory: 250Mi
diff --git a/charms/kserve-controller/tests/integration/test_charm.py b/charms/kserve-controller/tests/integration/test_charm.py
index 0090b09..bbb1af6 100644
--- a/charms/kserve-controller/tests/integration/test_charm.py
+++ b/charms/kserve-controller/tests/integration/test_charm.py
@@ -271,6 +271,7 @@ def create_namespace():
 @pytest.mark.parametrize(
     "inference_file",
     [
+        "./tests/integration/hugginface-bert.yaml",
         "./tests/integration/sklearn-iris.yaml",
         "./tests/integration/lgbserver.yaml",
         "./tests/integration/pmml-server.yaml",
@@ -300,8 +301,8 @@ def create_inf_svc():
 
     # Assert InferenceService state is Available
     @tenacity.retry(
-        wait=tenacity.wait_exponential(multiplier=1, min=1, max=15),
-        stop=tenacity.stop_after_attempt(30),
+        wait=tenacity.wait_exponential(multiplier=1, min=1, max=30),
+        stop=tenacity.stop_after_attempt(60),
         reraise=True,
     )
     def assert_inf_svc_state():