Skip to content

Commit f52824a

Browse files
committed
modify embedding sentence_transformers: raise the dimension and max_tokens warning thresholds in match_json
1 parent 1b973b4 commit f52824a

File tree

1 file changed

+4
-4
lines changed
  • xinference/model/embedding/sentence_transformers

1 file changed

+4
-4
lines changed

xinference/model/embedding/sentence_transformers/core.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -449,13 +449,13 @@ def match_json(
449449

450450
# Check model dimensions compatibility
451451
model_dimensions = model_family.dimensions
452-
if model_dimensions > 1536: # Very large embedding models
453-
return f"Large embedding model detected ({model_dimensions} dimensions), may have performance issues"
452+
if model_dimensions > 8192: # Extremely large embedding models
453+
return f"Extremely large embedding model detected ({model_dimensions} dimensions), may have performance issues"
454454

455455
# Check token limits
456456
max_tokens = model_family.max_tokens
457-
if max_tokens > 8192: # Very high token limits
458-
return f"High token limit model detected (max_tokens: {max_tokens}), may cause memory issues"
457+
if max_tokens > 131072: # Extremely high token limits (128K)
458+
return f"Extremely high token limit model detected (max_tokens: {max_tokens}), may cause memory issues"
459459

460460
# Check for special model requirements
461461
model_name = model_family.model_name.lower()

0 commit comments

Comments
 (0)