furiosa.server.api.rest package
Submodules
furiosa.server.api.rest.app module
- furiosa.server.api.rest.app.create(config: furiosa.server.settings.RESTServerConfig, predict_handler: furiosa.server.handlers.predict.PredictHandler, repository_handler: furiosa.server.handlers.repository.RepositoryHandler) -> fastapi.applications.FastAPI
- furiosa.server.api.rest.app.exception_handler(request: starlette.requests.Request, exc: furiosa.server.errors.ModelServerError) -> starlette.responses.JSONResponse
furiosa.server.api.rest.endpoints module
- class furiosa.server.api.rest.endpoints.BooleanResponse(response: bool, error_code: int = 400)
Bases: starlette.responses.Response
- class furiosa.server.api.rest.endpoints.ModelEndpoints(handler: furiosa.server.handlers.predict.PredictHandler)
Bases: object
- async infer(payload: furiosa.server.types.predict.InferenceRequest, model_name: str, model_version: Optional[str] = None) -> furiosa.server.types.predict.InferenceResponse
- async live() -> starlette.responses.Response
- async metadata() -> furiosa.server.types.predict.MetadataServerResponse
- async model_metadata(model_name: str, model_version: Optional[str] = None) -> furiosa.server.types.predict.MetadataModelResponse
- async model_ready(model_name: str, model_version: Optional[str] = None) -> starlette.responses.Response
- async ready() -> starlette.responses.Response
- class furiosa.server.api.rest.endpoints.ModelRepositoryEndpoints(handler: furiosa.server.handlers.repository.RepositoryHandler)
Bases: object
- async index(payload: furiosa.server.types.model_repository.RepositoryIndexRequest) -> furiosa.server.types.model_repository.RepositoryIndexResponse
- async load(model_name: str) -> starlette.responses.Response
- async unload(model_name: str) -> starlette.responses.Response
furiosa.server.api.rest.server module
- class furiosa.server.api.rest.server.RESTServer(config: furiosa.server.settings.RESTServerConfig, predict_handler: furiosa.server.handlers.predict.PredictHandler, repository_handler: furiosa.server.handlers.repository.RepositoryHandler)
Bases: object
- async start()
- async stop()