sparkleman committed on
Commit
50f89e3
·
1 Parent(s): ce2c37c

UPDATE: change default model load workflow

Browse files
Files changed (3) hide show
  1. app.py +17 -7
  2. config.production.yaml +11 -11
  3. config.py +2 -1
app.py CHANGED
@@ -87,11 +87,19 @@ for model_config in CONFIG.MODELS:
87
  )
88
  tmp_pipeline = PIPELINE(tmp_model, model_config.VOCAB)
89
 
90
- if model_config.DEFAULT:
91
- if model_config.REASONING:
92
- DEFAULT_REASONING_MODEL_NAME = model_config.SERVICE_NAME
93
- else:
94
- DEFALUT_MODEL_NAME = model_config.SERVICE_NAME
 
 
 
 
 
 
 
 
95
 
96
  print(model_config.DEFAULT_SAMPLER)
97
 
@@ -101,8 +109,10 @@ for model_config in CONFIG.MODELS:
101
  MODEL_STORAGE[model_config.SERVICE_NAME].pipeline = tmp_pipeline
102
 
103
 
104
- logger.info(f"DEFALUT_MODEL_NAME is `{DEFALUT_MODEL_NAME}`")
105
- logger.info(f"DEFAULT_REASONING_MODEL_NAME is `{DEFAULT_REASONING_MODEL_NAME}`")
 
 
106
 
107
 
108
  class ChatCompletionRequest(BaseModel):
 
87
  )
88
  tmp_pipeline = PIPELINE(tmp_model, model_config.VOCAB)
89
 
90
+ if model_config.DEFAULT_CHAT:
91
+ if DEFALUT_MODEL_NAME != None:
92
+ logger.info(
93
+ f"Load Model - Replace `DEFALUT_MODEL_NAME` from `{DEFALUT_MODEL_NAME}` to `{model_config.SERVICE_NAME}`"
94
+ )
95
+ DEFALUT_MODEL_NAME = model_config.SERVICE_NAME
96
+
97
+ if model_config.DEFAULT_REASONING:
98
+ if DEFAULT_REASONING_MODEL_NAME != None:
99
+ logger.info(
100
+ f"Load Model - Replace `DEFAULT_REASONING_MODEL_NAME` from `{DEFAULT_REASONING_MODEL_NAME}` to `{model_config.SERVICE_NAME}`"
101
+ )
102
+ DEFAULT_REASONING_MODEL_NAME = model_config.SERVICE_NAME
103
 
104
  print(model_config.DEFAULT_SAMPLER)
105
 
 
109
  MODEL_STORAGE[model_config.SERVICE_NAME].pipeline = tmp_pipeline
110
 
111
 
112
+ logger.info(f"Load Model - DEFALUT_MODEL_NAME is `{DEFALUT_MODEL_NAME}`")
113
+ logger.info(
114
+ f"Load Model - DEFAULT_REASONING_MODEL_NAME is `{DEFAULT_REASONING_MODEL_NAME}`"
115
+ )
116
 
117
 
118
  class ChatCompletionRequest(BaseModel):
config.production.yaml CHANGED
@@ -1,16 +1,17 @@
1
  HOST: "0.0.0.0"
2
  PORT: 7860
3
  STRATEGY: "cuda fp16"
4
- RWKV_CUDA_ON: False
5
  CHUNK_LEN: 256
6
  MODELS:
7
- - SERVICE_NAME: "RWKV-x070-World-0.1B-v2.8-20241210-ctx4096"
8
- DOWNLOAD_MODEL_FILE_NAME: "RWKV-x070-World-0.1B-v2.8-20241210-ctx4096.pth"
9
- DOWNLOAD_MODEL_REPO_ID: "BlinkDL/rwkv-7-world"
10
- REASONING: False
11
- DEFAULT: True
 
12
  DEFAULT_SAMPLER:
13
- max_tokens: 512
14
  temperature: 1.0
15
  top_p: 0.3
16
  presence_penalty: 0.5
@@ -20,11 +21,10 @@ MODELS:
20
  - "\n\n"
21
  stop_tokens:
22
  - 0
23
- - SERVICE_NAME: "rwkv7-g1-0.1b-20250307-ctx4096"
24
- DOWNLOAD_MODEL_FILE_NAME: "rwkv7-g1-0.1b-20250307-ctx4096.pth"
25
- DOWNLOAD_MODEL_REPO_ID: "BlinkDL/rwkv7-g1"
26
  REASONING: True
27
- DEFAULT: True
28
  DEFAULT_SAMPLER:
29
  max_tokens: 4096
30
  temperature: 1.0
 
1
  HOST: "0.0.0.0"
2
  PORT: 7860
3
  STRATEGY: "cuda fp16"
4
+ RWKV_CUDA_ON: True
5
  CHUNK_LEN: 256
6
  MODELS:
7
+ - SERVICE_NAME: "rwkv7-g1-0.1b-20250307-ctx4096"
8
+ DOWNLOAD_MODEL_FILE_NAME: "rwkv7-g1-0.1b-20250307-ctx4096.pth"
9
+ DOWNLOAD_MODEL_REPO_ID: "BlinkDL/rwkv7-g1"
10
+ REASONING: True
11
+ DEFAULT_CHAT: True
12
+ DEFAULT_REASONING: True
13
  DEFAULT_SAMPLER:
14
+ max_tokens: 4096
15
  temperature: 1.0
16
  top_p: 0.3
17
  presence_penalty: 0.5
 
21
  - "\n\n"
22
  stop_tokens:
23
  - 0
24
+ - SERVICE_NAME: "RWKV7-G1-1.5B-16%trained-20250308-ctx4k"
25
+ DOWNLOAD_MODEL_FILE_NAME: "RWKV7-G1-1.5B-16%trained-20250308-ctx4k.pth"
26
+ DOWNLOAD_MODEL_REPO_ID: "BlinkDL/rwkv-7-world"
27
  REASONING: True
 
28
  DEFAULT_SAMPLER:
29
  max_tokens: 4096
30
  temperature: 1.0
config.py CHANGED
@@ -49,7 +49,8 @@ class ModelConfig(BaseModel):
49
  False, description="Whether reasoning is enabled for this model."
50
  )
51
 
52
- DEFAULT: bool = Field(False, description="Whether this model is the default model.")
 
53
  DEFAULT_SAMPLER: SamplerConfig = Field(
54
  SamplerConfig(), description="Default sampler configuration for this model."
55
  )
 
49
  False, description="Whether reasoning is enabled for this model."
50
  )
51
 
52
+ DEFAULT_CHAT: bool = Field(False, description="Whether this model is the default chat model.")
53
+ DEFAULT_REASONING: bool = Field(False, description="Whether this model is the default reasoning model.")
54
  DEFAULT_SAMPLER: SamplerConfig = Field(
55
  SamplerConfig(), description="Default sampler configuration for this model."
56
  )