drizzlezyk committed on
Commit
73fe7ab
·
verified ·
1 Parent(s): 5893154

Upload inference/vllm_register.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. inference/vllm_register.py +31 -0
inference/vllm_register.py ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # coding=utf-8
2
+ # Copyright (c) 2025 Huawei Technologies Co., Ltd. All Rights Reserved.
3
+ # Copyright 2022 EleutherAI and the HuggingFace Inc. team. All rights reserved.
4
+ #
5
+ # This code is based on EleutherAI's GPT-NeoX library and the GPT-NeoX
6
+ # and OPT implementations in this library. It has been modified from its
7
+ # original forms to accommodate minor architectural differences compared
8
+ # to GPT-NeoX and OPT used by the Meta AI team that trained the model.
9
+ #
10
+ # Licensed under the Apache License, Version 2.0 (the "License");
11
+ # you may not use this file except in compliance with the License.
12
+ # You may obtain a copy of the License at
13
+ #
14
+ # http://www.apache.org/licenses/LICENSE-2.0
15
+ #
16
+ # Unless required by applicable law or agreed to in writing, software
17
+ # distributed under the License is distributed on an "AS IS" BASIS,
18
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
19
+ # See the License for the specific language governing permissions and
20
+ # limitations under the License.
21
+
22
+ import runpy
23
+ from vllm import ModelRegistry
24
+ from modeling_openpangu import PanguEmbeddedForCausalLM
25
+ import torch
26
+
27
+
28
# Architecture name under which the model class is registered with vLLM.
_ARCHITECTURE_NAME = "PanguEmbeddedForCausalLM"

# Module executed as the program entry point when this file is run directly.
_API_SERVER_MODULE = 'vllm.entrypoints.openai.api_server'

# Registration happens at import time, so it is in effect before the
# server module below starts executing.
ModelRegistry.register_model(_ARCHITECTURE_NAME, PanguEmbeddedForCausalLM)

if __name__ == '__main__':
    # Run the API server module as if it had been launched as ``__main__``.
    runpy.run_module(_API_SERVER_MODULE, run_name='__main__')