Skip to content

Commit

Permalink
fix: correctly set quantise for non quantise options
Browse files Browse the repository at this point in the history
Signed-off-by: Aaron Pham <contact@aarnphm.xyz>
  • Loading branch information
aarnphm committed Jun 14, 2024
1 parent 316925f commit d7e99c2
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 3 deletions.
4 changes: 2 additions & 2 deletions openllm-python/src/_openllm_tiny/_entrypoint.py
Original file line number Diff line number Diff line change
Expand Up @@ -43,7 +43,7 @@
import orjson,openllm_core.utils as coreutils
model_id='{__model_id__}'
revision=orjson.loads(coreutils.getenv('revision',default={__model_revision__}))
-quantise=coreutils.getenv('quantize',default='{__model_quantise__}',var=['QUANTISE'])
+quantise=orjson.loads(coreutils.getenv('quantize',default={__model_quantise__},var=['QUANTISE']))
serialisation=coreutils.getenv('serialization',default='{__model_serialization__}',var=['SERIALISATION'])
dtype=coreutils.getenv('dtype', default='{__model_dtype__}',var=['TORCH_DTYPE'])
trust_remote_code=coreutils.check_bool_env("TRUST_REMOTE_CODE",{__model_trust_remote_code__})
Expand Down Expand Up @@ -485,7 +485,7 @@ def build_command(
__command__=' '.join(['openllm', *sys.argv[1:]]),
__model_id__=model_id,
__model_revision__=orjson.dumps(model_revision),
-__model_quantise__=quantise,
+__model_quantise__=orjson.dumps(quantise),
__model_dtype__=dtype,
__model_serialization__=serialisation,
__model_trust_remote_code__=trust_remote_code,
Expand Down
2 changes: 1 addition & 1 deletion tools/dependencies.py
Original file line number Diff line number Diff line change
Expand Up @@ -234,7 +234,7 @@ def main(args) -> int:
release_version = args.release_version
else:
try:
-release_version = api.repos.get_latest_release()['name'].lstrip('v')
+release_version = api.repos.get_latest_release()['tag_name'].lstrip('v')
except Exception as err:
raise err

Expand Down

0 comments on commit d7e99c2

Please sign in to comment.