File tree Expand file tree Collapse file tree 1 file changed +4
-4
lines changed
xinference/model/embedding/sentence_transformers — 1 file changed, +4 -4 lines changed
Original file line number | Diff line number | Diff line change
@@ -449,13 +449,13 @@ def match_json(
449449
450450 # Check model dimensions compatibility
451451 model_dimensions = model_family .dimensions
452- if model_dimensions > 1536 : # Very large embedding models
453- return f"Large embedding model detected ({ model_dimensions } dimensions), may have performance issues"
452+ if model_dimensions > 8192 : # Extremely large embedding models
453+ return f"Extremely large embedding model detected ({ model_dimensions } dimensions), may have performance issues"
454454
455455 # Check token limits
456456 max_tokens = model_family .max_tokens
457- if max_tokens > 8192 : # Very high token limits
458- return f"High token limit model detected (max_tokens: { max_tokens } ), may cause memory issues"
457+ if max_tokens > 131072 : # Extremely high token limits (128K)
458+ return f"Extremely high token limit model detected (max_tokens: { max_tokens } ), may cause memory issues"
459459
460460 # Check for special model requirements
461461 model_name = model_family .model_name .lower ()
You can’t perform that action at this time.
0 commit comments