TiniThingsInc committed
Commit f9fe5e0 · verified · 1 parent: 15a2e15

Update app.py

Files changed (1)
  1. app.py +29 -36
app.py CHANGED
@@ -1,5 +1,5 @@
 """
-FairFate Embeddings API - Qwen3-Embedding-4B
+FF Embeddings API - Qwen3-Embedding-4B
 Multilingual semantic embeddings for tabletop RPG product classification
 """
 
@@ -13,9 +13,9 @@ import spaces # ZeroGPU decorator
 # Using Qwen3-Embedding-4B for 2560 native dimensions (truncate to 1536 for production)
 # Qwen3-4B is optimal for 1536 dims: 60% retention (vs 42.9% for GTE-Qwen2-7B)
 MODEL_NAME = "Qwen/Qwen3-Embedding-4B"
-print(f"🔄 Loading model: {MODEL_NAME}")
+print(f" Loading model: {MODEL_NAME}")
 model = SentenceTransformer(MODEL_NAME, trust_remote_code=True)
-print(f"Model loaded successfully")
+print(f" Model loaded successfully")
 print(f" Native Dimensions: {model.get_sentence_embedding_dimension()}")
 print(f" Max Seq Length: {model.max_seq_length}")
 print(f" Matryoshka Support: Yes (truncate to any dimension ≤ {model.get_sentence_embedding_dimension()})")
@@ -64,7 +64,7 @@ def generate_embeddings(
     # Qwen3-Embedding models support truncation to any dimension ≤ native_dims
     if output_dimensions != native_dims:
         if output_dimensions > native_dims:
-            print(f"⚠️ Warning: Requested {output_dimensions} dims but model has {native_dims}. Using {native_dims}.")
+            print(f"Warning: Requested {output_dimensions} dims but model has {native_dims}. Using {native_dims}.")
             output_dimensions = native_dims
         embeddings = embeddings[:, :output_dimensions]
 
@@ -84,9 +84,9 @@ def batch_generate(texts_input: str, use_instruction: bool, output_dims: int) ->
     try:
         embeddings = generate_embeddings(texts, use_instruction, output_dims)
 
-        result = f"Generated {len(embeddings)} embeddings\n"
-        result += f"📐 Dimensions: {len(embeddings[0])}\n"
-        result += f"🌍 Languages: 100+ supported\n\n"
+        result = f"Generated {len(embeddings)} embeddings\n"
+        result += f"Dimensions: {len(embeddings[0])}\n"
+        result += f"Languages: 100+ supported\n\n"
         result += "First embedding preview:\n"
         result += f"[{', '.join(f'{x:.3f}' for x in embeddings[0][:10])}...]\n"
 
@@ -170,7 +170,7 @@ def calculate_similarity(text1: str, text2: str, use_instruction: bool) -> str:
     Calculate comprehensive similarity metrics between two texts
     """
     if not text1.strip() or not text2.strip():
-        return "Error: Please provide both texts"
+        return "Error: Please provide both texts"
 
     try:
         embeddings = generate_embeddings([text1, text2], use_instruction)
@@ -181,7 +181,7 @@ def calculate_similarity(text1: str, text2: str, use_instruction: bool) -> str:
         metrics = calculate_all_similarities(emb1, emb2)
 
         # Build result string
-        result = "📊 **Comprehensive Similarity Analysis**\n\n"
+        result = "**Comprehensive Similarity Analysis**\n\n"
 
         # Cosine Similarity (Primary)
         emoji, interpretation = interpret_similarity(metrics['cosine'], 'cosine')
@@ -222,23 +222,23 @@ def calculate_similarity(text1: str, text2: str, use_instruction: bool) -> str:
         return f"❌ Error: {str(e)}"
 
 # Create Gradio interface
-with gr.Blocks(title="FairFate Embeddings API - Qwen3", theme=gr.themes.Soft()) as demo:
+with gr.Blocks(title="FF Embeddings API - Qwen3", theme=gr.themes.Soft()) as demo:
     gr.Markdown("""
-    # 🎲 FairFate Embeddings API
+    # FF Embeddings API
 
     **Powered by Qwen3-Embedding-4B** - Advanced Multilingual Embedding Model
 
-    - 🌍 **100+ Languages** (English, Spanish, French, German, Chinese, Japanese, etc.)
-    - 📐 **2560 Native Dimensions** (matryoshka truncation to 1536 for production)
-    - 📚 **32K Context** (massive text support)
-    - **Instruction-Aware** (optimized for RPG content)
-    - 🔬 **Matryoshka Support** (flexible 32-2560 dimensions)
-    - 🏆 **Optimal for 1536 dims** (60% dimension retention)
+    - **100+ Languages** (English, Spanish, French, German, Chinese, Japanese, etc.)
+    - **2560 Native Dimensions** (matryoshka truncation to 1536 for production)
+    - **32K Context** (massive text support)
+    - **Instruction-Aware** (optimized for RPG content)
+    - **Matryoshka Support** (flexible 32-2560 dimensions)
+    - **Optimal for 1536 dims** (60% dimension retention)
 
     Perfect for: Product classification, semantic search, recommendations, multilingual matching
     """)
 
-    with gr.Tab("🔮 Generate Embeddings"):
+    with gr.Tab("Generate Embeddings"):
         gr.Markdown("""
         Generate semantic embeddings for product descriptions, titles, or any text.
         Enter one text per line for batch processing.
@@ -271,7 +271,7 @@ with gr.Blocks(title="FairFate Embeddings API - Qwen3", theme=gr.themes.Soft())
             inputs=[input_text, use_inst, output_dims],
         )
 
-    with gr.Tab("🔍 Similarity Calculator"):
+    with gr.Tab("Similarity Calculator"):
         gr.Markdown("""
         **Comprehensive Similarity Analysis** - Compare two texts using multiple metrics:
 
@@ -314,9 +314,9 @@ with gr.Blocks(title="FairFate Embeddings API - Qwen3", theme=gr.themes.Soft())
             inputs=[text1, text2, use_inst_sim],
         )
 
-    with gr.Tab("📖 API Documentation"):
+    with gr.Tab("API Documentation"):
         gr.Markdown("""
-        ## 🚀 Quick Start
+        ## Quick Start
 
         ### Python
 
@@ -324,7 +324,7 @@ with gr.Blocks(title="FairFate Embeddings API - Qwen3", theme=gr.themes.Soft())
         import requests
         import numpy as np
 
-        url = "https://YOUR_USERNAME-fairfate-embeddings.hf.space/api/predict"
+        url = "https://TiniThingsInc-fairfate-embeddings.hf.space/api/predict"
 
         # Generate embeddings
         texts = [
@@ -350,7 +350,7 @@ with gr.Blocks(title="FairFate Embeddings API - Qwen3", theme=gr.themes.Soft())
         ### TypeScript/JavaScript
 
         ```typescript
-        const url = 'https://YOUR_USERNAME-fairfate-embeddings.hf.space/api/predict';
+        const url = 'https://TiniThingsInc-fairfate-embeddings.hf.space/api/predict';
 
         const response = await fetch(url, {
           method: 'POST',
@@ -373,7 +373,7 @@ with gr.Blocks(title="FairFate Embeddings API - Qwen3", theme=gr.themes.Soft())
 
         ```bash
         curl -X POST \\
-          https://YOUR_USERNAME-fairfate-embeddings.hf.space/api/predict \\
+          https://TiniThingsInc-fairfate-embeddings.hf.space/api/predict \\
           -H "Content-Type: application/json" \\
           -d '{
            "data": [["Your text here"], true, 1536],
@@ -381,7 +381,7 @@ with gr.Blocks(title="FairFate Embeddings API - Qwen3", theme=gr.themes.Soft())
           }'
         ```
 
-        ## 📊 Parameters
+        ## Parameters
 
         | Parameter | Type | Default | Description |
         |-----------|------|---------|-------------|
@@ -389,7 +389,7 @@ with gr.Blocks(title="FairFate Embeddings API - Qwen3", theme=gr.themes.Soft())
         | `use_instruction` | boolean | true | Add instruction prefix (improves accuracy) |
         | `output_dimensions` | number | 1536 | Output size (32-3584, production default: 1536) |
 
-        ## 🎯 Use Cases
+        ## Use Cases
 
         - **Product Classification**: Auto-tag by genre, system, theme
         - **Semantic Search**: Find by meaning, not keywords
@@ -397,20 +397,13 @@ with gr.Blocks(title="FairFate Embeddings API - Qwen3", theme=gr.themes.Soft())
         - **Duplicate Detection**: Find similar listings
         - **Multilingual Matching**: Cross-language similarity
 
-        ## Performance
-
-        | Batch Size | GPU Throughput | CPU Throughput |
-        |------------|----------------|----------------|
-        | 1 | ~800/sec | ~80/sec |
-        | 32 | ~4000/sec | ~250/sec |
-
-        ## 🌍 Supported Languages
+        ## Supported Languages
 
         English, Spanish, French, German, Italian, Portuguese, Russian, Polish, Dutch, Czech,
         Chinese, Japanese, Korean, Arabic, Hebrew, Hindi, Thai, Vietnamese, Indonesian,
         Turkish, Swedish, Norwegian, Danish, Finnish, Greek, Romanian, Hungarian, and 80+ more!
 
-        ## 📝 Citation
+        ## Citation
 
         ```bibtex
         @misc{qwen3-embedding-2025,
@@ -422,7 +415,7 @@ with gr.Blocks(title="FairFate Embeddings API - Qwen3", theme=gr.themes.Soft())
         ```
         """)
 
-    with gr.Tab("ℹ️ Model Info"):
+    with gr.Tab("Model Info"):
         gr.Markdown(f"""
         ## Model Details
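For context on the `generate_embeddings` hunk above: matryoshka truncation simply keeps the leading dimensions of the native 2560-dim vector, clamping oversized requests to the model's width. The sketch below mirrors that logic outside the app; the helper name `embed_truncated` and the re-normalization step are illustrative additions (the diff only shows the slice), not part of the committed code.

```python
import numpy as np
from sentence_transformers import SentenceTransformer

model = SentenceTransformer("Qwen/Qwen3-Embedding-4B", trust_remote_code=True)

def embed_truncated(texts, output_dimensions=1536):
    """Encode texts, then matryoshka-truncate to the requested width."""
    embeddings = model.encode(texts, convert_to_numpy=True)  # shape: (n, 2560)
    native_dims = embeddings.shape[1]
    if output_dimensions > native_dims:
        print(f"Warning: Requested {output_dimensions} dims but model has {native_dims}. Using {native_dims}.")
        output_dimensions = native_dims
    truncated = embeddings[:, :output_dimensions]  # keep the leading dimensions
    # Re-normalize so cosine similarity stays meaningful after truncation
    # (common matryoshka practice; assumption, not shown in the diff).
    norms = np.linalg.norm(truncated, axis=1, keepdims=True)
    return truncated / np.clip(norms, 1e-12, None)

vecs = embed_truncated(["Dark fantasy adventure module"], output_dimensions=1536)
print(vecs.shape)  # (1, 1536)
```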
 
 
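The Quick Start examples updated in this commit all target the same `/api/predict` route with a `data` payload of `[texts, use_instruction, output_dimensions]`. Below is a minimal Python sketch mirroring the curl example; the exact route and response shape depend on the Gradio version serving the Space, so treat the `resp.json()["data"][0]` access as an assumption rather than a guaranteed contract.

```python
import requests

# Endpoint as documented in the updated app.py docs above
url = "https://TiniThingsInc-fairfate-embeddings.hf.space/api/predict"

payload = {
    "data": [
        ["Your text here"],  # texts, one per line in the UI textbox
        True,                # use_instruction
        1536,                # output_dimensions
    ]
}

resp = requests.post(url, json=payload, timeout=120)
resp.raise_for_status()
# Assumed response layout: Gradio wraps outputs in a "data" list;
# the first element is the formatted summary string from batch_generate.
print(resp.json()["data"][0])
```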