Technologic101 committed on
Commit
ab1d8bc
·
1 Parent(s): 41422db

task: add fine-tuning and evaluation

Browse files
pyproject.toml CHANGED
@@ -35,6 +35,8 @@ dependencies = [
35
  "websockets>=11.0.3",
36
  "langsmith>=0.3.11",
37
  "matplotlib>=3.10.0",
 
 
38
  ]
39
 
40
  [build-system]
 
35
  "websockets>=11.0.3",
36
  "langsmith>=0.3.11",
37
  "matplotlib>=3.10.0",
38
+ "accelerate>=0.26.0",
39
+ "nest-asyncio>=1.6.0",
40
  ]
41
 
42
  [build-system]
src/fine_tune_embeddings.ipynb ADDED
@@ -0,0 +1,903 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cells": [
3
+ {
4
+ "cell_type": "markdown",
5
+ "metadata": {},
6
+ "source": [
7
+ "# Fine-tuning Embeddings for Design Data"
8
+ ]
9
+ },
10
+ {
11
+ "cell_type": "markdown",
12
+ "metadata": {},
13
+ "source": [
14
+ "Let's see if we can improve the quality of our returned results using a fine-tuned embedding model trained on our designs!\n",
15
+ "\n",
16
+ "We'll use SentenceTransformers to fine-tune our embedding model, as it provides a straightforward approach for adapting models to specific domains."
17
+ ]
18
+ },
19
+ {
20
+ "cell_type": "code",
21
+ "execution_count": 1,
22
+ "metadata": {},
23
+ "outputs": [],
24
+ "source": [
25
+ "# Install required packages if needed\n",
26
+ "# !pip install sentence-transformers datasets torch matplotlib"
27
+ ]
28
+ },
29
+ {
30
+ "cell_type": "code",
31
+ "execution_count": 2,
32
+ "metadata": {},
33
+ "outputs": [],
34
+ "source": [
35
+ "import json\n",
36
+ "import os\n",
37
+ "import pandas as pd\n",
38
+ "import numpy as np\n",
39
+ "import torch\n",
40
+ "import matplotlib.pyplot as plt\n",
41
+ "from pathlib import Path\n",
42
+ "from sentence_transformers import SentenceTransformer, InputExample, losses\n",
43
+ "from sentence_transformers.evaluation import EmbeddingSimilarityEvaluator\n",
44
+ "from torch.utils.data import DataLoader"
45
+ ]
46
+ },
47
+ {
48
+ "cell_type": "markdown",
49
+ "metadata": {},
50
+ "source": [
51
+ "## 1. Load Design Data\n",
52
+ "\n",
53
+ "First, we'll load the design data from our existing dataset."
54
+ ]
55
+ },
56
+ {
57
+ "cell_type": "code",
58
+ "execution_count": 3,
59
+ "metadata": {},
60
+ "outputs": [
61
+ {
62
+ "name": "stdout",
63
+ "output_type": "stream",
64
+ "text": [
65
+ "/Users/owner/Desktop/Projects/ai-maker-space/code/ImagineUI/src/data/designs\n",
66
+ "Loaded 141 designs\n"
67
+ ]
68
+ },
69
+ {
70
+ "data": {
71
+ "text/html": [
72
+ "<div>\n",
73
+ "<style scoped>\n",
74
+ " .dataframe tbody tr th:only-of-type {\n",
75
+ " vertical-align: middle;\n",
76
+ " }\n",
77
+ "\n",
78
+ " .dataframe tbody tr th {\n",
79
+ " vertical-align: top;\n",
80
+ " }\n",
81
+ "\n",
82
+ " .dataframe thead th {\n",
83
+ " text-align: right;\n",
84
+ " }\n",
85
+ "</style>\n",
86
+ "<table border=\"1\" class=\"dataframe\">\n",
87
+ " <thead>\n",
88
+ " <tr style=\"text-align: right;\">\n",
89
+ " <th></th>\n",
90
+ " <th>id</th>\n",
91
+ " <th>text</th>\n",
92
+ " <th>categories</th>\n",
93
+ " <th>visual_characteristics</th>\n",
94
+ " </tr>\n",
95
+ " </thead>\n",
96
+ " <tbody>\n",
97
+ " <tr>\n",
98
+ " <th>0</th>\n",
99
+ " <td>135</td>\n",
100
+ " <td>Design 135:\\n Description: This des...</td>\n",
101
+ " <td>[Traditional, Elegant, Text-Heavy, Classic]</td>\n",
102
+ " <td>[Muted Color Palette, Vertical Layout, Serif T...</td>\n",
103
+ " </tr>\n",
104
+ " <tr>\n",
105
+ " <th>1</th>\n",
106
+ " <td>132</td>\n",
107
+ " <td>Design 132:\\n Description: This des...</td>\n",
108
+ " <td>[minimalist, nature-inspired, modern, zen-them...</td>\n",
109
+ " <td>[white background, green accents, illustrative...</td>\n",
110
+ " </tr>\n",
111
+ " <tr>\n",
112
+ " <th>2</th>\n",
113
+ " <td>104</td>\n",
114
+ " <td>Design 104:\\n Description: The CSS ...</td>\n",
115
+ " <td>[minimalism, elegance, typography, web design ...</td>\n",
116
+ " <td>[subtle color palette, classic serif fonts, cl...</td>\n",
117
+ " </tr>\n",
118
+ " <tr>\n",
119
+ " <th>3</th>\n",
120
+ " <td>103</td>\n",
121
+ " <td>Design 103:\\n Description: This des...</td>\n",
122
+ " <td>[vintage, classical, dramatic, ornate, elegant]</td>\n",
123
+ " <td>[dark color palette, gold accents, traditional...</td>\n",
124
+ " </tr>\n",
125
+ " <tr>\n",
126
+ " <th>4</th>\n",
127
+ " <td>168</td>\n",
128
+ " <td>Design 168:\\n Description: This des...</td>\n",
129
+ " <td>[Humorous, Educational, Whimsical, Nature-them...</td>\n",
130
+ " <td>[Vibrant color palette, Whimsical illustration...</td>\n",
131
+ " </tr>\n",
132
+ " </tbody>\n",
133
+ "</table>\n",
134
+ "</div>"
135
+ ],
136
+ "text/plain": [
137
+ " id text \\\n",
138
+ "0 135 Design 135:\\n Description: This des... \n",
139
+ "1 132 Design 132:\\n Description: This des... \n",
140
+ "2 104 Design 104:\\n Description: The CSS ... \n",
141
+ "3 103 Design 103:\\n Description: This des... \n",
142
+ "4 168 Design 168:\\n Description: This des... \n",
143
+ "\n",
144
+ " categories \\\n",
145
+ "0 [Traditional, Elegant, Text-Heavy, Classic] \n",
146
+ "1 [minimalist, nature-inspired, modern, zen-them... \n",
147
+ "2 [minimalism, elegance, typography, web design ... \n",
148
+ "3 [vintage, classical, dramatic, ornate, elegant] \n",
149
+ "4 [Humorous, Educational, Whimsical, Nature-them... \n",
150
+ "\n",
151
+ " visual_characteristics \n",
152
+ "0 [Muted Color Palette, Vertical Layout, Serif T... \n",
153
+ "1 [white background, green accents, illustrative... \n",
154
+ "2 [subtle color palette, classic serif fonts, cl... \n",
155
+ "3 [dark color palette, gold accents, traditional... \n",
156
+ "4 [Vibrant color palette, Whimsical illustration... "
157
+ ]
158
+ },
159
+ "execution_count": 3,
160
+ "metadata": {},
161
+ "output_type": "execute_result"
162
+ }
163
+ ],
164
+ "source": [
165
+ "def load_design_data():\n",
166
+ " \"\"\"Load design data from the metadata files\"\"\"\n",
167
+ " designs_dir = Path.cwd().parent / \"src\" / \"data\" / \"designs\"\n",
168
+ " print(designs_dir)\n",
169
+ " designs = []\n",
170
+ " \n",
171
+ " # Load all metadata files\n",
172
+ " for design_dir in designs_dir.glob(\"**/metadata.json\"):\n",
173
+ " try:\n",
174
+ " with open(design_dir, \"r\") as f:\n",
175
+ " metadata = json.load(f)\n",
176
+ " \n",
177
+ " # Create a text representation of the design\n",
178
+ " text = f\"\"\"Design {metadata.get('id', 'unknown')}:\n",
179
+ " Description: {metadata.get('description', 'No description available')}\n",
180
+ " Categories: {', '.join(metadata.get('categories', []))}\n",
181
+ " Visual Characteristics: {', '.join(metadata.get('visual_characteristics', []))}\n",
182
+ " \"\"\"\n",
183
+ " \n",
184
+ " designs.append({\n",
185
+ " 'id': metadata.get('id', 'unknown'),\n",
186
+ " 'text': text.strip(),\n",
187
+ " 'categories': metadata.get('categories', []),\n",
188
+ " 'visual_characteristics': metadata.get('visual_characteristics', [])\n",
189
+ " })\n",
190
+ " except Exception as e:\n",
191
+ " print(f\"Error processing design {design_dir}: {e}\")\n",
192
+ " continue\n",
193
+ " \n",
194
+ " print(f\"Loaded {len(designs)} designs\")\n",
195
+ " return designs\n",
196
+ "\n",
197
+ "designs = load_design_data()\n",
198
+ "designs_df = pd.DataFrame(designs)\n",
199
+ "designs_df.head()"
200
+ ]
201
+ },
202
+ {
203
+ "cell_type": "markdown",
204
+ "metadata": {},
205
+ "source": [
206
+ "## 2. Create Training Pairs\n",
207
+ "\n",
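208
+ "For fine-tuning, we need pairs of designs labeled with a similarity score. Ideally this would include both positive pairs (similar designs) and negative pairs (dissimilar designs); the code below only generates positive pairs, keeping each design's top 3 most similar designs when their similarity is above 0.2. We'll use the overlap of categories and visual characteristics (Jaccard similarity) to determine similarity."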
209
+ ]
210
+ },
211
+ {
212
+ "cell_type": "code",
213
+ "execution_count": 8,
214
+ "metadata": {},
215
+ "outputs": [
216
+ {
217
+ "name": "stdout",
218
+ "output_type": "stream",
219
+ "text": [
220
+ "Creating training pairs...\n",
221
+ "Created 95 training examples and 27 evaluation examples\n"
222
+ ]
223
+ }
224
+ ],
225
+ "source": [
226
+ "from sentence_transformers import InputExample\n",
227
+ "def create_training_pairs(designs_df, num_pairs=5000):\n",
228
+ " \"\"\"Create training pairs for fine-tuning\"\"\"\n",
229
+ " training_pairs = []\n",
230
+ " design_ids = designs_df['id'].tolist()\n",
231
+ " \n",
232
+ " # Calculate similarity between designs based on categories and characteristics\n",
233
+ " def calculate_similarity(design1, design2):\n",
234
+ " # Get categories and characteristics for both designs\n",
235
+ " cats1 = set(design1['categories'])\n",
236
+ " cats2 = set(design2['categories'])\n",
237
+ " chars1 = set(design1['visual_characteristics'])\n",
238
+ " chars2 = set(design2['visual_characteristics'])\n",
239
+ " \n",
240
+ " # Calculate Jaccard similarity for categories and characteristics\n",
241
+ " cat_sim = len(cats1.intersection(cats2)) / max(1, len(cats1.union(cats2)))\n",
242
+ " char_sim = len(chars1.intersection(chars2)) / max(1, len(chars1.union(chars2)))\n",
243
+ " \n",
244
+ " # Weighted similarity\n",
245
+ " return 0.5 * cat_sim + 0.5 * char_sim\n",
246
+ " \n",
247
+ " # Create similarity matrix\n",
248
+ " import random\n",
249
+ " train_examples = []\n",
250
+ " eval_examples = []\n",
251
+ " \n",
252
+ " # Create positive pairs (similar designs)\n",
253
+ " for i in range(len(designs_df)):\n",
254
+ " design1 = designs_df.iloc[i].to_dict()\n",
255
+ " similarities = []\n",
256
+ " \n",
257
+ " for j in range(len(designs_df)):\n",
258
+ " if i != j:\n",
259
+ " design2 = designs_df.iloc[j].to_dict()\n",
260
+ " sim = calculate_similarity(design1, design2)\n",
261
+ " similarities.append((j, sim))\n",
262
+ " \n",
263
+ " # Sort by similarity\n",
264
+ " similarities.sort(key=lambda x: x[1], reverse=True)\n",
265
+ " \n",
266
+ " # Add top similar designs as positive pairs\n",
267
+ " for j, sim in similarities[:3]: # Top 3 most similar\n",
268
+ " if sim > 0.2: # Only if they're somewhat similar\n",
269
+ " design2 = designs_df.iloc[j].to_dict()\n",
270
+ " # Create InputExample with texts and similarity score\n",
271
+ " example = InputExample(texts=[design1['text'], design2['text']], label=float(sim))\n",
272
+ " \n",
273
+ " # 80% for training, 20% for evaluation\n",
274
+ " if random.random() < 0.8:\n",
275
+ " train_examples.append(example)\n",
276
+ " else:\n",
277
+ " eval_examples.append(example)\n",
278
+ " \n",
279
+ " print(f\"Created {len(train_examples)} training examples and {len(eval_examples)} evaluation examples\")\n",
280
+ " return train_examples, eval_examples\n",
281
+ "\n",
282
+ "print(\"Creating training pairs...\")\n",
283
+ "train_examples, eval_examples = create_training_pairs(designs_df) "
284
+ ]
285
+ },
286
+ {
287
+ "cell_type": "markdown",
288
+ "metadata": {},
289
+ "source": [
290
+ "## 3. Fine-tune the Model\n",
291
+ "\n",
292
+ "The model I've selected here is the distilbert-base-nli-stsb-mean-tokens model, chosen as a comparison because its BERT training is effective at semantic similarity. Performance isn't too important here, since we have one design per query and we want to return the best match."
293
+ ]
294
+ },
295
+ {
296
+ "cell_type": "code",
297
+ "execution_count": 10,
298
+ "metadata": {},
299
+ "outputs": [
300
+ {
301
+ "name": "stdout",
302
+ "output_type": "stream",
303
+ "text": [
304
+ "Starting model fine-tuning...\n",
305
+ "Loading base model: sentence-transformers/distilbert-base-nli-stsb-mean-tokens\n",
306
+ "\n",
307
+ "Training configuration:\n",
308
+ "- Training examples: 95\n",
309
+ "- Evaluation examples: 27\n",
310
+ "- Batch size: 16\n",
311
+ "- Warmup steps: 0\n",
312
+ "- Using GPU: False\n",
313
+ "- Model will be saved to: /Users/owner/Desktop/Projects/ai-maker-space/code/ImagineUI/src/fine_tuned_design_embeddings_20250225_161918\n"
314
+ ]
315
+ },
316
+ {
317
+ "data": {
318
+ "application/vnd.jupyter.widget-view+json": {
319
+ "model_id": "e4315da477764680aaacae97230e6409",
320
+ "version_major": 2,
321
+ "version_minor": 0
322
+ },
323
+ "text/plain": [
324
+ "Computing widget examples: 0%| | 0/1 [00:00<?, ?example/s]"
325
+ ]
326
+ },
327
+ "metadata": {},
328
+ "output_type": "display_data"
329
+ },
330
+ {
331
+ "data": {
332
+ "text/html": [
333
+ "\n",
334
+ " <div>\n",
335
+ " \n",
336
+ " <progress value='6' max='6' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
337
+ " [6/6 00:36, Epoch 1/1]\n",
338
+ " </div>\n",
339
+ " <table border=\"1\" class=\"dataframe\">\n",
340
+ " <thead>\n",
341
+ " <tr style=\"text-align: left;\">\n",
342
+ " <th>Step</th>\n",
343
+ " <th>Training Loss</th>\n",
344
+ " <th>Validation Loss</th>\n",
345
+ " <th>Pearson Cosine</th>\n",
346
+ " <th>Spearman Cosine</th>\n",
347
+ " </tr>\n",
348
+ " </thead>\n",
349
+ " <tbody>\n",
350
+ " <tr>\n",
351
+ " <td>6</td>\n",
352
+ " <td>No log</td>\n",
353
+ " <td>No log</td>\n",
354
+ " <td>-0.139605</td>\n",
355
+ " <td>-0.068639</td>\n",
356
+ " </tr>\n",
357
+ " </tbody>\n",
358
+ "</table><p>"
359
+ ],
360
+ "text/plain": [
361
+ "<IPython.core.display.HTML object>"
362
+ ]
363
+ },
364
+ "metadata": {},
365
+ "output_type": "display_data"
366
+ },
367
+ {
368
+ "name": "stdout",
369
+ "output_type": "stream",
370
+ "text": [
371
+ "\n",
372
+ "Training complete!\n",
373
+ "Model saved to /Users/owner/Desktop/Projects/ai-maker-space/code/ImagineUI/src/fine_tuned_design_embeddings_20250225_161918\n"
374
+ ]
375
+ }
376
+ ],
377
+ "source": [
378
+ "def fine_tune_model_simple(train_examples, eval_examples, base_model=\"sentence-transformers/distilbert-base-nli-stsb-mean-tokens\"):\n",
379
+ " \"\"\"Fine-tune a SentenceTransformer model\"\"\"\n",
380
+ " import os\n",
381
+ " import torch\n",
382
+ " from datetime import datetime\n",
383
+ " from sentence_transformers import SentenceTransformer, losses\n",
384
+ " from sentence_transformers.evaluation import EmbeddingSimilarityEvaluator\n",
385
+ " from torch.utils.data import DataLoader\n",
386
+ " \n",
387
+ " # Load the base model\n",
388
+ " print(f\"Loading base model: {base_model}\")\n",
389
+ " model = SentenceTransformer(base_model)\n",
390
+ " \n",
391
+ " # Create training dataloader\n",
392
+ " train_dataloader = DataLoader(train_examples, shuffle=True, batch_size=16)\n",
393
+ " \n",
394
+ " # Use CosineSimilarityLoss for fine-tuning\n",
395
+ " train_loss = losses.CosineSimilarityLoss(model)\n",
396
+ " \n",
397
+ " # Create evaluator\n",
398
+ " evaluator = EmbeddingSimilarityEvaluator.from_input_examples(eval_examples)\n",
399
+ " \n",
400
+ " # Create timestamped model save path\n",
401
+ " timestamp = datetime.now().strftime(\"%Y%m%d_%H%M%S\")\n",
402
+ " model_save_path = os.path.join(os.getcwd(), \"fine_tuned_design_embeddings_\" + timestamp)\n",
403
+ " \n",
404
+ " # Set up warm-up steps\n",
405
+ " warmup_steps = int(len(train_dataloader) * 0.1)\n",
406
+ "\n",
407
+ " print(f\"\\nTraining configuration:\")\n",
408
+ " print(f\"- Training examples: {len(train_examples)}\")\n",
409
+ " print(f\"- Evaluation examples: {len(eval_examples)}\")\n",
410
+ " print(f\"- Batch size: 16\")\n",
411
+ " print(f\"- Warmup steps: {warmup_steps}\")\n",
412
+ " print(f\"- Using GPU: {torch.cuda.is_available()}\")\n",
413
+ " print(f\"- Model will be saved to: {model_save_path}\")\n",
414
+ " \n",
415
+ " # Train the model\n",
416
+ " model.fit(\n",
417
+ " train_objectives=[(train_dataloader, train_loss)],\n",
418
+ " evaluator=evaluator,\n",
419
+ " epochs=1, # Start with just 1 epoch to test\n",
420
+ " warmup_steps=warmup_steps,\n",
421
+ " output_path=model_save_path,\n",
422
+ " show_progress_bar=True\n",
423
+ " )\n",
424
+ " \n",
425
+ " print(f\"\\nTraining complete!\")\n",
426
+ " print(f\"Model saved to {model_save_path}\")\n",
427
+ " \n",
428
+ " return model, model_save_path\n",
429
+ "\n",
430
+ "print(\"Starting model fine-tuning...\")\n",
431
+ "fine_tuned_model, model_path = fine_tune_model_simple(train_examples, eval_examples)\n"
432
+ ]
433
+ },
434
+ {
435
+ "cell_type": "markdown",
436
+ "metadata": {},
437
+ "source": [
438
+ "## 4. Evaluate Fine-tuned Model vs Base Model"
439
+ ]
440
+ },
441
+ {
442
+ "cell_type": "markdown",
443
+ "metadata": {},
444
+ "source": [
445
+ "We'll need nest_asyncio to run the async evaluation inside a Jupyter notebook."
446
+ ]
447
+ },
448
+ {
449
+ "cell_type": "code",
450
+ "execution_count": 14,
451
+ "metadata": {},
452
+ "outputs": [],
453
+ "source": [
454
+ "import nest_asyncio\n",
455
+ "nest_asyncio.apply()"
456
+ ]
457
+ },
458
+ {
459
+ "cell_type": "code",
460
+ "execution_count": 16,
461
+ "metadata": {},
462
+ "outputs": [],
463
+ "source": [
464
+ "# Now define a synchronous wrapper for our comparison function\n",
465
+ "def compare_models_sync(base_model_name, fine_tuned_model_path, test_queries):\n",
466
+ " \"\"\"Synchronous wrapper for compare_models\"\"\"\n",
467
+ " import asyncio\n",
468
+ " from langchain_openai import ChatOpenAI\n",
469
+ " import json\n",
470
+ " \n",
471
+ " # Load models\n",
472
+ " print(f\"Loading base model: {base_model_name}\")\n",
473
+ " base_model = SentenceTransformer(base_model_name)\n",
474
+ " \n",
475
+ " print(f\"Loading fine-tuned model from: {fine_tuned_model_path}\")\n",
476
+ " fine_tuned_model = SentenceTransformer(fine_tuned_model_path)\n",
477
+ " \n",
478
+ " # Initialize evaluator\n",
479
+ " llm = ChatOpenAI(model=\"gpt-4\", temperature=0)\n",
480
+ " \n",
481
+ " # Create a retrieval function using each model\n",
482
+ " def retrieve_with_model(model, query, k=1):\n",
483
+ " # Get embeddings for designs\n",
484
+ " design_texts = designs_df['text'].tolist()\n",
485
+ " design_embeddings = model.encode(design_texts, convert_to_tensor=True)\n",
486
+ " \n",
487
+ " # Get query embedding\n",
488
+ " query_embedding = model.encode(query, convert_to_tensor=True)\n",
489
+ " \n",
490
+ " # Calculate cosine similarities\n",
491
+ " cos_scores = torch.nn.functional.cosine_similarity(query_embedding.unsqueeze(0), design_embeddings)\n",
492
+ " \n",
493
+ " # Get top k designs\n",
494
+ " top_k_indices = torch.topk(cos_scores, k=k).indices.tolist()\n",
495
+ " \n",
496
+ " # Return top k designs\n",
497
+ " return [designs_df.iloc[i] for i in top_k_indices]\n",
498
+ " \n",
499
+ " # Evaluate a design match\n",
500
+ " async def evaluate_match(query, design):\n",
501
+ " prompt = f\"\"\"You are evaluating a design recommendation system.\n",
502
+ " \n",
503
+ " USER REQUIREMENTS:\n",
504
+ " {query}\n",
505
+ " \n",
506
+ " RECOMMENDED DESIGN:\n",
507
+ " {design['text']}\n",
508
+ " \n",
509
+ " Score how well the recommended design matches the user's requirements on a scale of 0-10.\n",
510
+ " Provide your score and brief explanation in JSON format exactly like this:\n",
511
+ " {{\n",
512
+ " \"score\": 7,\n",
513
+ " \"reason\": \"The design aligns with the requirements because...\"\n",
514
+ " }}\n",
515
+ " \n",
516
+ " Return only valid JSON, nothing else.\n",
517
+ " \"\"\"\n",
518
+ " \n",
519
+ " try:\n",
520
+ " response = await llm.ainvoke(prompt)\n",
521
+ " result = json.loads(response.content)\n",
522
+ " return result\n",
523
+ " except Exception as e:\n",
524
+ " print(f\"Error evaluating match: {e}\")\n",
525
+ " return {\"score\": 0, \"reason\": f\"Error parsing evaluation: {e}\"}\n",
526
+ " \n",
527
+ " # Test with both models\n",
528
+ " results = []\n",
529
+ " \n",
530
+ " # Define the evaluation function\n",
531
+ " async def evaluate_all_queries():\n",
532
+ " for i, query in enumerate(test_queries):\n",
533
+ " print(f\"Evaluating query {i+1}/{len(test_queries)}: {query[:50]}...\")\n",
534
+ " \n",
535
+ " # Get top result from each model\n",
536
+ " base_result = retrieve_with_model(base_model, query)[0]\n",
537
+ " fine_tuned_result = retrieve_with_model(fine_tuned_model, query)[0]\n",
538
+ " \n",
539
+ " # Evaluate matches\n",
540
+ " base_eval = await evaluate_match(query, base_result)\n",
541
+ " fine_tuned_eval = await evaluate_match(query, fine_tuned_result)\n",
542
+ " \n",
543
+ " # Store results\n",
544
+ " results.append({\n",
545
+ " \"query\": query,\n",
546
+ " \"base_model_id\": base_result['id'],\n",
547
+ " \"fine_tuned_model_id\": fine_tuned_result['id'],\n",
548
+ " \"base_score\": base_eval.get(\"score\", 0),\n",
549
+ " \"base_reason\": base_eval.get(\"reason\", \"Error\"),\n",
550
+ " \"fine_tuned_score\": fine_tuned_eval.get(\"score\", 0),\n",
551
+ " \"fine_tuned_reason\": fine_tuned_eval.get(\"reason\", \"Error\"),\n",
552
+ " \"models_differ\": base_result['id'] != fine_tuned_result['id']\n",
553
+ " })\n",
554
+ " \n",
555
+ " print(f\" Base model: Design {base_result['id']} - Score: {base_eval.get('score', 0)}\")\n",
556
+ " print(f\" Fine-tuned: Design {fine_tuned_result['id']} - Score: {fine_tuned_eval.get('score', 0)}\")\n",
557
+ " \n",
558
+ " # Run the async evaluation using the event loop\n",
559
+ " loop = asyncio.get_event_loop()\n",
560
+ " loop.run_until_complete(evaluate_all_queries())\n",
561
+ " \n",
562
+ " return pd.DataFrame(results)"
563
+ ]
564
+ },
565
+ {
566
+ "cell_type": "code",
567
+ "execution_count": 17,
568
+ "metadata": {},
569
+ "outputs": [
570
+ {
571
+ "name": "stdout",
572
+ "output_type": "stream",
573
+ "text": [
574
+ "Loading base model: sentence-transformers/distilbert-base-nli-stsb-mean-tokens\n",
575
+ "Loading fine-tuned model from: /Users/owner/Desktop/Projects/ai-maker-space/code/ImagineUI/src/fine_tuned_design_embeddings_20250225_161918\n",
576
+ "Evaluating query 1/8: I need a minimalist design with lots of whitespace...\n",
577
+ " Base model: Design 220 - Score: 8\n",
578
+ " Fine-tuned: Design 144 - Score: 9\n",
579
+ "Evaluating query 2/8: Looking for a playful, colorful design with rounde...\n",
580
+ " Base model: Design 129 - Score: 8\n",
581
+ " Fine-tuned: Design 129 - Score: 8\n",
582
+ "Evaluating query 3/8: Need a professional business design with a dark th...\n",
583
+ " Base model: Design 204 - Score: 8\n",
584
+ " Fine-tuned: Design 204 - Score: 8\n",
585
+ "Evaluating query 4/8: Want a nature-inspired design with organic shapes...\n",
586
+ " Base model: Design 190 - Score: 8\n",
587
+ " Fine-tuned: Design 215 - Score: 0\n",
588
+ "Evaluating query 5/8: Looking for a tech-focused design with a futuristi...\n",
589
+ " Base model: Design 012 - Score: 9\n",
590
+ " Fine-tuned: Design 012 - Score: 9\n",
591
+ "Evaluating query 6/8: I want the craziest design you can find...\n",
592
+ " Base model: Design 008 - Score: 8\n",
593
+ " Fine-tuned: Design 008 - Score: 8\n",
594
+ "Evaluating query 7/8: I'd like an eye-catching design for a small busine...\n",
595
+ " Base model: Design 006 - Score: 8\n",
596
+ " Fine-tuned: Design 006 - Score: 8\n",
597
+ "Evaluating query 8/8: I want something clinical and informative...\n",
598
+ " Base model: Design 130 - Score: 8\n",
599
+ " Fine-tuned: Design 004 - Score: 8\n"
600
+ ]
601
+ },
602
+ {
603
+ "data": {
604
+ "text/html": [
605
+ "<div>\n",
606
+ "<style scoped>\n",
607
+ " .dataframe tbody tr th:only-of-type {\n",
608
+ " vertical-align: middle;\n",
609
+ " }\n",
610
+ "\n",
611
+ " .dataframe tbody tr th {\n",
612
+ " vertical-align: top;\n",
613
+ " }\n",
614
+ "\n",
615
+ " .dataframe thead th {\n",
616
+ " text-align: right;\n",
617
+ " }\n",
618
+ "</style>\n",
619
+ "<table border=\"1\" class=\"dataframe\">\n",
620
+ " <thead>\n",
621
+ " <tr style=\"text-align: right;\">\n",
622
+ " <th></th>\n",
623
+ " <th>query</th>\n",
624
+ " <th>base_model_id</th>\n",
625
+ " <th>fine_tuned_model_id</th>\n",
626
+ " <th>base_score</th>\n",
627
+ " <th>base_reason</th>\n",
628
+ " <th>fine_tuned_score</th>\n",
629
+ " <th>fine_tuned_reason</th>\n",
630
+ " <th>models_differ</th>\n",
631
+ " </tr>\n",
632
+ " </thead>\n",
633
+ " <tbody>\n",
634
+ " <tr>\n",
635
+ " <th>0</th>\n",
636
+ " <td>I need a minimalist design with lots of whites...</td>\n",
637
+ " <td>220</td>\n",
638
+ " <td>144</td>\n",
639
+ " <td>8</td>\n",
640
+ " <td>The design aligns with the user's requirements...</td>\n",
641
+ " <td>9</td>\n",
642
+ " <td>The recommended design matches the user's requ...</td>\n",
643
+ " <td>True</td>\n",
644
+ " </tr>\n",
645
+ " <tr>\n",
646
+ " <th>1</th>\n",
647
+ " <td>Looking for a playful, colorful design with ro...</td>\n",
648
+ " <td>129</td>\n",
649
+ " <td>129</td>\n",
650
+ " <td>8</td>\n",
651
+ " <td>The design aligns with the user's requirements...</td>\n",
652
+ " <td>8</td>\n",
653
+ " <td>The design aligns with the user's requirements...</td>\n",
654
+ " <td>False</td>\n",
655
+ " </tr>\n",
656
+ " <tr>\n",
657
+ " <th>2</th>\n",
658
+ " <td>Need a professional business design with a dar...</td>\n",
659
+ " <td>204</td>\n",
660
+ " <td>204</td>\n",
661
+ " <td>8</td>\n",
662
+ " <td>The design aligns with the user's requirements...</td>\n",
663
+ " <td>8</td>\n",
664
+ " <td>The design aligns with the user's requirements...</td>\n",
665
+ " <td>False</td>\n",
666
+ " </tr>\n",
667
+ " <tr>\n",
668
+ " <th>3</th>\n",
669
+ " <td>Want a nature-inspired design with organic shapes</td>\n",
670
+ " <td>190</td>\n",
671
+ " <td>215</td>\n",
672
+ " <td>8</td>\n",
673
+ " <td>The design aligns with the user's requirements...</td>\n",
674
+ " <td>0</td>\n",
675
+ " <td>The recommended design does not match the user...</td>\n",
676
+ " <td>True</td>\n",
677
+ " </tr>\n",
678
+ " <tr>\n",
679
+ " <th>4</th>\n",
680
+ " <td>Looking for a tech-focused design with a futur...</td>\n",
681
+ " <td>012</td>\n",
682
+ " <td>012</td>\n",
683
+ " <td>9</td>\n",
684
+ " <td>The recommended design aligns very well with t...</td>\n",
685
+ " <td>9</td>\n",
686
+ " <td>The recommended design aligns very well with t...</td>\n",
687
+ " <td>False</td>\n",
688
+ " </tr>\n",
689
+ " <tr>\n",
690
+ " <th>5</th>\n",
691
+ " <td>I want the craziest design you can find</td>\n",
692
+ " <td>008</td>\n",
693
+ " <td>008</td>\n",
694
+ " <td>8</td>\n",
695
+ " <td>The design aligns with the user's requirements...</td>\n",
696
+ " <td>8</td>\n",
697
+ " <td>The recommended design matches the user's requ...</td>\n",
698
+ " <td>False</td>\n",
699
+ " </tr>\n",
700
+ " <tr>\n",
701
+ " <th>6</th>\n",
702
+ " <td>I'd like an eye-catching design for a small bu...</td>\n",
703
+ " <td>006</td>\n",
704
+ " <td>006</td>\n",
705
+ " <td>8</td>\n",
706
+ " <td>The recommended design matches the user's requ...</td>\n",
707
+ " <td>8</td>\n",
708
+ " <td>The recommended design matches the user's requ...</td>\n",
709
+ " <td>False</td>\n",
710
+ " </tr>\n",
711
+ " <tr>\n",
712
+ " <th>7</th>\n",
713
+ " <td>I want something clinical and informative</td>\n",
714
+ " <td>130</td>\n",
715
+ " <td>004</td>\n",
716
+ " <td>8</td>\n",
717
+ " <td>The recommended design matches the user's requ...</td>\n",
718
+ " <td>8</td>\n",
719
+ " <td>The design aligns with the user's requirements...</td>\n",
720
+ " <td>True</td>\n",
721
+ " </tr>\n",
722
+ " </tbody>\n",
723
+ "</table>\n",
724
+ "</div>"
725
+ ],
726
+ "text/plain": [
727
+ " query base_model_id \\\n",
728
+ "0 I need a minimalist design with lots of whites... 220 \n",
729
+ "1 Looking for a playful, colorful design with ro... 129 \n",
730
+ "2 Need a professional business design with a dar... 204 \n",
731
+ "3 Want a nature-inspired design with organic shapes 190 \n",
732
+ "4 Looking for a tech-focused design with a futur... 012 \n",
733
+ "5 I want the craziest design you can find 008 \n",
734
+ "6 I'd like an eye-catching design for a small bu... 006 \n",
735
+ "7 I want something clinical and informative 130 \n",
736
+ "\n",
737
+ " fine_tuned_model_id base_score \\\n",
738
+ "0 144 8 \n",
739
+ "1 129 8 \n",
740
+ "2 204 8 \n",
741
+ "3 215 8 \n",
742
+ "4 012 9 \n",
743
+ "5 008 8 \n",
744
+ "6 006 8 \n",
745
+ "7 004 8 \n",
746
+ "\n",
747
+ " base_reason fine_tuned_score \\\n",
748
+ "0 The design aligns with the user's requirements... 9 \n",
749
+ "1 The design aligns with the user's requirements... 8 \n",
750
+ "2 The design aligns with the user's requirements... 8 \n",
751
+ "3 The design aligns with the user's requirements... 0 \n",
752
+ "4 The recommended design aligns very well with t... 9 \n",
753
+ "5 The design aligns with the user's requirements... 8 \n",
754
+ "6 The recommended design matches the user's requ... 8 \n",
755
+ "7 The recommended design matches the user's requ... 8 \n",
756
+ "\n",
757
+ " fine_tuned_reason models_differ \n",
758
+ "0 The recommended design matches the user's requ... True \n",
759
+ "1 The design aligns with the user's requirements... False \n",
760
+ "2 The design aligns with the user's requirements... False \n",
761
+ "3 The recommended design does not match the user... True \n",
762
+ "4 The recommended design aligns very well with t... False \n",
763
+ "5 The recommended design matches the user's requ... False \n",
764
+ "6 The recommended design matches the user's requ... False \n",
765
+ "7 The design aligns with the user's requirements... True "
766
+ ]
767
+ },
768
+ "execution_count": 17,
769
+ "metadata": {},
770
+ "output_type": "execute_result"
771
+ }
772
+ ],
773
+ "source": [
774
+ "\n",
775
+ "test_queries = [\n",
776
+ " \"I need a minimalist design with lots of whitespace\",\n",
777
+ " \"Looking for a playful, colorful design with rounded elements\",\n",
778
+ " \"Need a professional business design with a dark theme\",\n",
779
+ " \"Want a nature-inspired design with organic shapes\",\n",
780
+ " \"Looking for a tech-focused design with a futuristic feel\",\n",
781
+ " \"I want the craziest design you can find\",\n",
782
+ " \"I'd like an eye-catching design for a small business\",\n",
783
+ " \"I want something clinical and informative\"\n",
784
+ "]\n",
785
+ "\n",
786
+ "comparison_results = compare_models_sync(\"sentence-transformers/distilbert-base-nli-stsb-mean-tokens\", model_path, test_queries)\n",
787
+ "comparison_results"
788
+ ]
789
+ },
790
+ {
791
+ "cell_type": "markdown",
792
+ "metadata": {},
793
+ "source": [
794
+ "Using this, we can verify the design returned by each model for each query. A standout element is the \"0\" scored by the fine-tuned model at row index 3 of the table above (the fourth query, \"Want a nature-inspired design with organic shapes\"). Checking the returned design, it's definitely not the nature-inspired design we were looking for. The model without fine-tuning hasn't missed a query that badly, so it's unclear why the training moved in the wrong direction."
795
+ ]
796
+ },
797
+ {
798
+ "cell_type": "markdown",
799
+ "metadata": {},
800
+ "source": [
801
+ "## 5. Visualize Comparison Results"
802
+ ]
803
+ },
804
+ {
805
+ "cell_type": "code",
806
+ "execution_count": 18,
807
+ "metadata": {},
808
+ "outputs": [
809
+ {
810
+ "data": {
811
+ "image/png": "",
812
+ "text/plain": [
813
+ "<Figure size 1000x600 with 2 Axes>"
814
+ ]
815
+ },
816
+ "metadata": {},
817
+ "output_type": "display_data"
818
+ },
819
+ {
820
+ "name": "stdout",
821
+ "output_type": "stream",
822
+ "text": [
823
+ "Average Base Model Score: 8.12\n",
824
+ "Average Fine-tuned Model Score: 7.25\n",
825
+ "Average Improvement: -0.88 (-10.8%)\n"
826
+ ]
827
+ }
828
+ ],
829
+ "source": [
830
+ "# Visualize comparison results\n",
831
+ "plt.figure(figsize=(10, 6))\n",
832
+ "\n",
833
+ "# Calculate improvement\n",
834
+ "comparison_results['improvement'] = comparison_results['fine_tuned_score'] - comparison_results['base_score']\n",
835
+ "\n",
836
+ "# Bar chart comparing scores\n",
837
+ "plt.subplot(1, 2, 1)\n",
838
+ "x = np.arange(len(comparison_results))\n",
839
+ "width = 0.35\n",
840
+ "\n",
841
+ "plt.bar(x - width/2, comparison_results['base_score'], width, label='Base Model')\n",
842
+ "plt.bar(x + width/2, comparison_results['fine_tuned_score'], width, label='Fine-tuned Model')\n",
843
+ "\n",
844
+ "plt.xlabel('Query')\n",
845
+ "plt.ylabel('Score (0-10)')\n",
846
+ "plt.title('Base vs Fine-tuned Model Performance')\n",
847
+ "plt.xticks(x, range(1, len(comparison_results) + 1))\n",
848
+ "plt.legend()\n",
849
+ "\n",
850
+ "# Improvement chart\n",
851
+ "plt.subplot(1, 2, 2)\n",
852
+ "colors = ['green' if x > 0 else 'red' for x in comparison_results['improvement']]\n",
853
+ "plt.bar(range(1, len(comparison_results) + 1), comparison_results['improvement'], color=colors)\n",
854
+ "plt.axhline(y=0, color='k', linestyle='-', alpha=0.3)\n",
855
+ "plt.xlabel('Query')\n",
856
+ "plt.ylabel('Score Improvement')\n",
857
+ "plt.title('Fine-tuned Model Improvement')\n",
858
+ "\n",
859
+ "plt.tight_layout()\n",
860
+ "plt.show()\n",
861
+ "\n",
862
+ "# Show overall improvement\n",
863
+ "avg_base_score = comparison_results['base_score'].mean()\n",
864
+ "avg_fine_tuned_score = comparison_results['fine_tuned_score'].mean()\n",
865
+ "avg_improvement = avg_fine_tuned_score - avg_base_score\n",
866
+ "\n",
867
+ "print(f\"Average Base Model Score: {avg_base_score:.2f}\")\n",
868
+ "print(f\"Average Fine-tuned Model Score: {avg_fine_tuned_score:.2f}\")\n",
869
+ "print(f\"Average Improvement: {avg_improvement:.2f} ({avg_improvement/avg_base_score*100:.1f}%)\")"
870
+ ]
871
+ },
872
+ {
873
+ "cell_type": "markdown",
874
+ "metadata": {},
875
+ "source": [
876
+ "## Conclusion\n",
877
+ "\n",
878
+ "We were able to fine-tune an embedding model on pairs of our designs and evaluate it against a set of test queries, but the results were disappointing: the average score dropped from 8.12 for the base model to 7.25 for the fine-tuned model. We don't want to launch an embedding model that hurts our performance, so we'll stick with the existing RAG agent. But with more queries, more data, and testing more models, there may be a way to find improvements."
879
+ ]
880
+ }
881
+ ],
882
+ "metadata": {
883
+ "kernelspec": {
884
+ "display_name": ".venv",
885
+ "language": "python",
886
+ "name": "python3"
887
+ },
888
+ "language_info": {
889
+ "codemirror_mode": {
890
+ "name": "ipython",
891
+ "version": 3
892
+ },
893
+ "file_extension": ".py",
894
+ "mimetype": "text/x-python",
895
+ "name": "python",
896
+ "nbconvert_exporter": "python",
897
+ "pygments_lexer": "ipython3",
898
+ "version": "3.11.11"
899
+ }
900
+ },
901
+ "nbformat": 4,
902
+ "nbformat_minor": 4
903
+ }
src/fine_tuned_design_embeddings_20250225_161918/1_Pooling/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 768,
3
+ "pooling_mode_cls_token": false,
4
+ "pooling_mode_mean_tokens": true,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false,
7
+ "pooling_mode_weightedmean_tokens": false,
8
+ "pooling_mode_lasttoken": false,
9
+ "include_prompt": true
10
+ }
src/fine_tuned_design_embeddings_20250225_161918/README.md ADDED
@@ -0,0 +1,533 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - sentence-transformers
4
+ - sentence-similarity
5
+ - feature-extraction
6
+ - generated_from_trainer
7
+ - dataset_size:95
8
+ - loss:CosineSimilarityLoss
9
+ base_model: sentence-transformers/distilbert-base-nli-stsb-mean-tokens
10
+ widget:
11
+ - source_sentence: "Design 115:\n Description: The design utilizes a dramatic\
12
+ \ red and black color palette, creating a high contrast and visually striking\
13
+ \ interface that emphasizes boldness and clarity. The layout is structured with\
14
+ \ a central column for main content and a sidebar for navigation, enhancing usability.\
15
+ \ Typography is classic and easy to read, using white text for legibility against\
16
+ \ dark backgrounds. The design features subtle gradient backgrounds and occasional\
17
+ \ fiery imagery, contributing to a dynamic and modern aesthetic.\n \
18
+ \ Categories: Web Design, Minimalist, Modern, Typography\n Visual Characteristics:\
19
+ \ High Contrast, Central Column Layout, Bold Typography, Red and Black Palette,\
20
+ \ Gradient Background"
21
+ sentences:
22
+ - "Design 185:\n Description: The design features a bold contrast between\
23
+ \ a bright blue header and a predominantly black background, creating a modern\
24
+ \ and striking visual impact. The use of crisp typography in white enhances readability\
25
+ \ against the dark backdrop, while an accent of orange in a sidebar provides additional\
26
+ \ contrast and attention-grabbing potential. The layout follows a structured and\
27
+ \ logical arrangement, guiding the viewer's eye through a series of selectable\
28
+ \ design options and resource links, creating a user-friendly and engaging experience.\n\
29
+ \ Categories: Modern, Typography, Web Design, Classic, User Friendly\n\
30
+ \ Visual Characteristics: High Contrast, Bold Colors, Structured Layout,\
31
+ \ Readable Typography, Accent Highlights"
32
+ - "Design 002:\n Description: The design embodies a serene and focused\
33
+ \ aesthetic with a soft, warm color scheme and straightforward typography. A prominent\
34
+ \ header creates an inviting entry point, while the balanced layout effectively\
35
+ \ organizes the content. Subtle shadows and borders provide depth, enhancing visual\
36
+ \ appeal without overwhelming the viewer.\n Categories: Web Design,\
37
+ \ Minimalism, Typography, Navigation\n Visual Characteristics: Warm\
38
+ \ color palette, Minimalistic layout, Simplicity, Balanced whitespace"
39
+ - "Design 200:\n Description: The design features a vibrant blue color\
40
+ \ scheme complemented by white and black typography, creating a striking contrast.\
41
+ \ The use of textured borders and background effects adds depth and visual interest.\
42
+ \ The layout is organized, with distinct sections for text content that enhance\
43
+ \ readability. The design reflects a modern and clean aesthetic, offering a sense\
44
+ \ of technological advancement and innovation.\n Categories: Modern,\
45
+ \ Typography, Web Design, Colorful\n Visual Characteristics: Vibrant\
46
+ \ Color, Textured Background, High Contrast, Organized Layout"
47
+ - source_sentence: "Design 142:\n Description: The design effortlessly\
48
+ \ combines a dark, textured background with bold, contrasting typography, creating\
49
+ \ a visually striking and modern aesthetic. The use of minimalist elements and\
50
+ \ a focused color palette emphasizes the central text, while the overall layout\
51
+ \ feels balanced and sophisticated.\n Categories: Modern, Minimalist,\
52
+ \ Typography-focused, Dark theme\n Visual Characteristics: Textured\
53
+ \ background, Contrasting colors, Bold typography, Sophisticated layout"
54
+ sentences:
55
+ - "Design 106:\n Description: This design features a minimalist and retro\
56
+ \ aesthetic with a muted color palette predominantly composed of olive green and\
57
+ \ subtle contrasts. The layout utilizes clean, sans-serif typography and a straightforward\
58
+ \ column format to present information in a clear and organized manner. The overall\
59
+ \ style evokes a calm and contemplative mood, reminiscent of classic web designs,\
60
+ \ with an emphasis on simplicity and readability.\n Categories: Minimalism,\
61
+ \ Retro, Web Design, Typography, Information Design\n Visual Characteristics:\
62
+ \ Muted color palette, Clean typography, Column layout, Simple navigation, Classic\
63
+ \ aesthetic"
64
+ - "Design 009:\n Description: This design features a clean and organized\
65
+ \ layout with a classic monochrome color palette, emphasizing the elegance of\
66
+ \ CSS design. It uses serif typography for a traditional feel, with strong visual\
67
+ \ separation of sections, enhancing readability. The design incorporates ornamental\
68
+ \ graphics at the top and bottom, adding a touch of sophistication. The ample\
69
+ \ use of whitespace contributes to a serene and uncluttered experience, inviting\
70
+ \ users to engage with the content.\n Categories: Web Design, Typography,\
71
+ \ Minimalism, Ornamental Design, Monochrome\n Visual Characteristics:\
72
+ \ Serif Typography, Monochromatic Palette, Ornamental Graphics, Whitespace Usage,\
73
+ \ Classic Layout"
74
+ - "Design 184:\n Description: The design features a subtle and harmonious\
75
+ \ aesthetic using a pastel green color scheme that evokes tranquility and balance.\
76
+ \ The layout is clean and structured, with a mix of serif and sans-serif typography\
77
+ \ that enhances readability. Decorative elements like the zen-like symbol and\
78
+ \ soft imagery provide an abstract, soothing quality, contributing to the theme\
79
+ \ of enlightenment and calm. This design is suited for audiences interested in\
80
+ \ modern CSS design principles and invites exploration and participation.\n \
81
+ \ Categories: Minimalist, Modern, Educational, Web-focused\n \
82
+ \ Visual Characteristics: Subtle color palette, Sophisticated typography, Clean\
83
+ \ layout, Zen imagery, Textured background"
84
+ - source_sentence: "Design 122:\n Description: The design features a minimalist\
85
+ \ aesthetic with a dominant white space, paired with subtle green accents and\
86
+ \ a hint of red, creating a clean and sophisticated look. The layout is vertical\
87
+ \ and structured, highlighting content purposefully with ample spacing, making\
88
+ \ it easy to read and navigate. The typography is elegant, using a serif font\
89
+ \ for headings to contrast with a simpler body text, supporting a Zen-like theme\
90
+ \ that embodies simplicity and clarity.\n Categories: minimalist, sophisticated,\
91
+ \ text-focused, zen-inspired\n Visual Characteristics: vertical layout,\
92
+ \ white space, green and red accents, serif typography"
93
+ sentences:
94
+ - "Design 195:\n Description: The design exemplifies a clean and minimalistic\
95
+ \ style, highlighting simplicity and readability through a dominance of white\
96
+ \ space and light, pastel background textures. It integrates a single-column layout\
97
+ \ with a sidebar for easy navigation, using a consistent and harmonious color\
98
+ \ palette composed mainly of soft greens, oranges, and muted text colors to ensure\
99
+ \ a smooth visual experience.\n Categories: Minimalist, Web Design,\
100
+ \ Modern, Typography\n Visual Characteristics: Simple Layout, Light\
101
+ \ Color Palette, Ample White Space, Readable Typography"
102
+ - "Design 187:\n Description: The design features a mystical, nature-inspired\
103
+ \ theme with a rustic color palette of dark greens and earthy reds. Intricate\
104
+ \ textures and foliage imagery offer a sense of depth, complemented by elegant\
105
+ \ serif typography that conveys a classic and sophisticated mood. The layout uses\
106
+ \ clear sections for content, enhancing readability and user engagement.\n \
107
+ \ Categories: Nature, Mystical, Classic, Rustic, Elegant\n \
108
+ \ Visual Characteristics: Dark Green Palette, Earthy Red Accents, Serif Typography,\
109
+ \ Textured Background, Nature Imagery"
110
+ - "Design 162:\n Description: The design embodies a classic, elegant\
111
+ \ style with a warm color palette dominated by earthy tones, enhanced by an ornate\
112
+ \ decorative header image. It uses a narrow column layout that focuses attention\
113
+ \ on the textual content, which is complemented by a textured background, adding\
114
+ \ depth and sophistication. The typography combines bold headings with a serif\
115
+ \ font, lending an old-world charm that aligns with the historical and sophisticated\
116
+ \ mood.\n Categories: classic, elegant, historical, sophisticated,\
117
+ \ text-focused\n Visual Characteristics: earthy color palette, ornate\
118
+ \ header, textured background, serif typography, narrow column layout"
119
+ - source_sentence: "Design 137:\n Description: The design presents a sleek,\
120
+ \ unified aesthetic utilizing a blue monochromatic color palette, giving it a\
121
+ \ modern and tech-centric appeal. Clean, crisp typography paired with visually\
122
+ \ engaging graphics contribute to its overall appeal, while the structured layout\
123
+ \ effectively organizes content for easy navigation and readability.\n \
124
+ \ Categories: Modern, Tech, Minimalist, Corporate, Professional\n \
125
+ \ Visual Characteristics: Monochromatic color scheme, Structured layout, Modern\
126
+ \ typography, High contrast, Tech-inspired graphics"
127
+ sentences:
128
+ - "Design 184:\n Description: The design features a subtle and harmonious\
129
+ \ aesthetic using a pastel green color scheme that evokes tranquility and balance.\
130
+ \ The layout is clean and structured, with a mix of serif and sans-serif typography\
131
+ \ that enhances readability. Decorative elements like the zen-like symbol and\
132
+ \ soft imagery provide an abstract, soothing quality, contributing to the theme\
133
+ \ of enlightenment and calm. This design is suited for audiences interested in\
134
+ \ modern CSS design principles and invites exploration and participation.\n \
135
+ \ Categories: Minimalist, Modern, Educational, Web-focused\n \
136
+ \ Visual Characteristics: Subtle color palette, Sophisticated typography, Clean\
137
+ \ layout, Zen imagery, Textured background"
138
+ - "Design 175:\n Description: The design showcases a balanced layout\
139
+ \ with a minimalist aesthetic, focused on demonstrating the power of CSS-based\
140
+ \ design. It features a clean and organized structure with a dominant use of blues\
141
+ \ and whites, complemented by modern, sans-serif typography. Silhouetted figures\
142
+ \ add a visual interest while maintaining a professional tone, making the page\
143
+ \ feel sophisticated and informative. The layout is well-suited for showcasing\
144
+ \ text content effectively, facilitating easy navigation through clear hierarchy.\n\
145
+ \ Categories: Minimalist, Technology, Informational, Professional,\
146
+ \ Modern\n Visual Characteristics: Clean layout, Balanced color palette,\
147
+ \ Silhouette imagery, Sans-serif typography, Organized structure"
148
+ - "Design 009:\n Description: This design features a clean and organized\
149
+ \ layout with a classic monochrome color palette, emphasizing the elegance of\
150
+ \ CSS design. It uses serif typography for a traditional feel, with strong visual\
151
+ \ separation of sections, enhancing readability. The design incorporates ornamental\
152
+ \ graphics at the top and bottom, adding a touch of sophistication. The ample\
153
+ \ use of whitespace contributes to a serene and uncluttered experience, inviting\
154
+ \ users to engage with the content.\n Categories: Web Design, Typography,\
155
+ \ Minimalism, Ornamental Design, Monochrome\n Visual Characteristics:\
156
+ \ Serif Typography, Monochromatic Palette, Ornamental Graphics, Whitespace Usage,\
157
+ \ Classic Layout"
158
+ - source_sentence: "Design 170:\n Description: The design of the CSS Zen\
159
+ \ Garden is exemplary with its soothing blue tones, providing a calm and professional\
160
+ \ aesthetic. The heart icons add a touch of creativity and warmth. The layout\
161
+ \ is clean and well-structured with clear navigation on the right-hand side, providing\
162
+ \ users easy access to additional information and style sheets. The typography\
163
+ \ varies, highlighting key sections and maintaining readability throughout.\n\
164
+ \ Categories: Web Design, CSS Showcase, Typography, User Interface,\
165
+ \ Aesthetic\n Visual Characteristics: Soothing Color Palette, Structured\
166
+ \ Layout, Iconography, Hierarchical Typography, Calming Aesthetic"
167
+ sentences:
168
+ - "Design 122:\n Description: The design features a minimalist aesthetic\
169
+ \ with a dominant white space, paired with subtle green accents and a hint of\
170
+ \ red, creating a clean and sophisticated look. The layout is vertical and structured,\
171
+ \ highlighting content purposefully with ample spacing, making it easy to read\
172
+ \ and navigate. The typography is elegant, using a serif font for headings to\
173
+ \ contrast with a simpler body text, supporting a Zen-like theme that embodies\
174
+ \ simplicity and clarity.\n Categories: minimalist, sophisticated,\
175
+ \ text-focused, zen-inspired\n Visual Characteristics: vertical layout,\
176
+ \ white space, green and red accents, serif typography"
177
+ - "Design 194:\n Description: This design exudes a minimalist elegance\
178
+ \ with a muted, earthy color palette and a clean layout, embodying a sense of\
179
+ \ calm and sophistication. The subtle use of textures and classic serif typography\
180
+ \ enhances the refined aesthetic, while the centered alignment and generous spacing\
181
+ \ contribute to a relaxed readability. The incorporation of a delicate floral\
182
+ \ illustration adds a touch of organic charm, making the design feel both timeless\
183
+ \ and inviting.\n Categories: Minimalism, Elegant, Organic, Sophisticated,\
184
+ \ Classic\n Visual Characteristics: Muted Color Palette, Serif Typography,\
185
+ \ Centered Layout, Generous Spacing, Floral Illustration"
186
+ - "Design 143:\n Description: This design features a clean and structured\
187
+ \ layout with a monochromatic color scheme, highlighting text content with clear\
188
+ \ typographic hierarchy. A combination of minimalist aesthetic and functional\
189
+ \ design elements ensures readability and visual interest, while the central image\
190
+ \ adds a focal point. The use of borders and shadow effects provide depth to the\
191
+ \ overall design.\n Categories: Minimalism, Monochrome, Typography,\
192
+ \ Web Design, User Interface\n Visual Characteristics: Clear typographic\
193
+ \ hierarchy, Grid alignment, Monochromatic color scheme, Minimalist style, Use\
194
+ \ of borders, Shadow effects"
195
+ pipeline_tag: sentence-similarity
196
+ library_name: sentence-transformers
197
+ metrics:
198
+ - pearson_cosine
199
+ - spearman_cosine
200
+ model-index:
201
+ - name: SentenceTransformer based on sentence-transformers/distilbert-base-nli-stsb-mean-tokens
202
+ results:
203
+ - task:
204
+ type: semantic-similarity
205
+ name: Semantic Similarity
206
+ dataset:
207
+ name: Unknown
208
+ type: unknown
209
+ metrics:
210
+ - type: pearson_cosine
211
+ value: -0.13960523700017818
212
+ name: Pearson Cosine
213
+ - type: spearman_cosine
214
+ value: -0.06863870136546027
215
+ name: Spearman Cosine
216
+ ---
217
+
218
+ # SentenceTransformer based on sentence-transformers/distilbert-base-nli-stsb-mean-tokens
219
+
220
+ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [sentence-transformers/distilbert-base-nli-stsb-mean-tokens](https://huggingface.co/sentence-transformers/distilbert-base-nli-stsb-mean-tokens). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
221
+
222
+ ## Model Details
223
+
224
+ ### Model Description
225
+ - **Model Type:** Sentence Transformer
226
+ - **Base model:** [sentence-transformers/distilbert-base-nli-stsb-mean-tokens](https://huggingface.co/sentence-transformers/distilbert-base-nli-stsb-mean-tokens) <!-- at revision cb8a28f4e13e28fde6137942584fc8a4ec701060 -->
227
+ - **Maximum Sequence Length:** 128 tokens
228
+ - **Output Dimensionality:** 768 dimensions
229
+ - **Similarity Function:** Cosine Similarity
230
+ <!-- - **Training Dataset:** Unknown -->
231
+ <!-- - **Language:** Unknown -->
232
+ <!-- - **License:** Unknown -->
233
+
234
+ ### Model Sources
235
+
236
+ - **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
237
+ - **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
238
+ - **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
239
+
240
+ ### Full Model Architecture
241
+
242
+ ```
243
+ SentenceTransformer(
244
+ (0): Transformer({'max_seq_length': 128, 'do_lower_case': False}) with Transformer model: DistilBertModel
245
+ (1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
246
+ )
247
+ ```
248
+
249
+ ## Usage
250
+
251
+ ### Direct Usage (Sentence Transformers)
252
+
253
+ First install the Sentence Transformers library:
254
+
255
+ ```bash
256
+ pip install -U sentence-transformers
257
+ ```
258
+
259
+ Then you can load this model and run inference.
260
+ ```python
261
+ from sentence_transformers import SentenceTransformer
262
+
263
+ # Download from the 🤗 Hub
264
+ model = SentenceTransformer("sentence_transformers_model_id")
265
+ # Run inference
266
+ sentences = [
267
+ 'Design 170:\n Description: The design of the CSS Zen Garden is exemplary with its soothing blue tones, providing a calm and professional aesthetic. The heart icons add a touch of creativity and warmth. The layout is clean and well-structured with clear navigation on the right-hand side, providing users easy access to additional information and style sheets. The typography varies, highlighting key sections and maintaining readability throughout.\n Categories: Web Design, CSS Showcase, Typography, User Interface, Aesthetic\n Visual Characteristics: Soothing Color Palette, Structured Layout, Iconography, Hierarchical Typography, Calming Aesthetic',
268
+ 'Design 143:\n Description: This design features a clean and structured layout with a monochromatic color scheme, highlighting text content with clear typographic hierarchy. A combination of minimalist aesthetic and functional design elements ensures readability and visual interest, while the central image adds a focal point. The use of borders and shadow effects provide depth to the overall design.\n Categories: Minimalism, Monochrome, Typography, Web Design, User Interface\n Visual Characteristics: Clear typographic hierarchy, Grid alignment, Monochromatic color scheme, Minimalist style, Use of borders, Shadow effects',
269
+ 'Design 194:\n Description: This design exudes a minimalist elegance with a muted, earthy color palette and a clean layout, embodying a sense of calm and sophistication. The subtle use of textures and classic serif typography enhances the refined aesthetic, while the centered alignment and generous spacing contribute to a relaxed readability. The incorporation of a delicate floral illustration adds a touch of organic charm, making the design feel both timeless and inviting.\n Categories: Minimalism, Elegant, Organic, Sophisticated, Classic\n Visual Characteristics: Muted Color Palette, Serif Typography, Centered Layout, Generous Spacing, Floral Illustration',
270
+ ]
271
+ embeddings = model.encode(sentences)
272
+ print(embeddings.shape)
273
+ # [3, 768]
274
+
275
+ # Get the similarity scores for the embeddings
276
+ similarities = model.similarity(embeddings, embeddings)
277
+ print(similarities.shape)
278
+ # [3, 3]
279
+ ```
280
+
281
+ <!--
282
+ ### Direct Usage (Transformers)
283
+
284
+ <details><summary>Click to see the direct usage in Transformers</summary>
285
+
286
+ </details>
287
+ -->
288
+
289
+ <!--
290
+ ### Downstream Usage (Sentence Transformers)
291
+
292
+ You can finetune this model on your own dataset.
293
+
294
+ <details><summary>Click to expand</summary>
295
+
296
+ </details>
297
+ -->
298
+
299
+ <!--
300
+ ### Out-of-Scope Use
301
+
302
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
303
+ -->
304
+
305
+ ## Evaluation
306
+
307
+ ### Metrics
308
+
309
+ #### Semantic Similarity
310
+
311
+ * Evaluated with [<code>EmbeddingSimilarityEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.EmbeddingSimilarityEvaluator)
312
+
313
+ | Metric | Value |
314
+ |:--------------------|:------------|
315
+ | pearson_cosine | -0.1396 |
316
+ | **spearman_cosine** | **-0.0686** |
317
+
318
+ <!--
319
+ ## Bias, Risks and Limitations
320
+
321
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
322
+ -->
323
+
324
+ <!--
325
+ ### Recommendations
326
+
327
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
328
+ -->
329
+
330
+ ## Training Details
331
+
332
+ ### Training Dataset
333
+
334
+ #### Unnamed Dataset
335
+
336
+ * Size: 95 training samples
337
+ * Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>label</code>
338
+ * Approximate statistics based on the first 95 samples:
339
+ | | sentence_0 | sentence_1 | label |
340
+ |:--------|:-------------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|:----------------------------------------------------------------|
341
+ | type | string | string | float |
342
+ | details | <ul><li>min: 90 tokens</li><li>mean: 116.28 tokens</li><li>max: 128 tokens</li></ul> | <ul><li>min: 90 tokens</li><li>mean: 115.79 tokens</li><li>max: 128 tokens</li></ul> | <ul><li>min: 0.21</li><li>mean: 0.26</li><li>max: 0.5</li></ul> |
343
+ * Samples:
344
+ | sentence_0 | sentence_1 | label |
345
+ |:-----------|:-----------|:------|
346
+ | <code>Design 148:<br> Description: This visual design features a clean and minimalistic layout with an emphasis on typography and balanced spacing. The dark gray background contrasts with the white text elements, providing a modern and sophisticated look. The design also includes vertical lines and a sidebar to separate different sections, adding structure without cluttering the visual flow.<br> Categories: minimalism, typography, contrast, layout design, modern aesthetics<br> Visual Characteristics: high contrast, monochromatic palette, well-defined spacing, balanced composition, structured layout</code> | <code>Design 156:<br> Description: The design uses a bold, contrasting color palette dominated by red, black, and white, highlighting a silhouetted figure against a background with traditional Japanese elements. The typography is clear and has a balance between serif and sans-serif fonts, adding to the mix of modern and traditional aesthetics. The layout is clean, with sections distinctly separated by subtle gradients, providing a sense of order and cohesiveness. The overall tone is a blend of contemporary design with cultural nuances, making it both engaging and visually striking.<br> Categories: modern design, cultural elements, typography, minimalism, contrast<br> Visual Characteristics: bold color palette, silhouette, gradients, clean layout, traditional motifs</code> | <code>0.21428571428571427</code> |
347
+ | <code>Design 135:<br> Description: This design uses an elegant and traditional aesthetic, with a muted color palette featuring cream and terracotta tones. The use of a patterned background adds texture, while the vertical layout and serif typography provide a classic and sophisticated feel. The design balances text-heavy content with organized sections, making information easily accessible, and its ornate flourishes add a touch of refinement.<br> Categories: Traditional, Elegant, Text-Heavy, Classic<br> Visual Characteristics: Muted Color Palette, Vertical Layout, Serif Typography, Textured Background, Ornate Flourishes</code> | <code>Design 194:<br> Description: This design exudes a minimalist elegance with a muted, earthy color palette and a clean layout, embodying a sense of calm and sophistication. The subtle use of textures and classic serif typography enhances the refined aesthetic, while the centered alignment and generous spacing contribute to a relaxed readability. The incorporation of a delicate floral illustration adds a touch of organic charm, making the design feel both timeless and inviting.<br> Categories: Minimalism, Elegant, Organic, Sophisticated, Classic<br> Visual Characteristics: Muted Color Palette, Serif Typography, Centered Layout, Generous Spacing, Floral Illustration</code> | <code>0.26785714285714285</code> |
348
+ | <code>Design 130:<br> Description: The visual design features a clean and structured layout with a calming color palette of beige and blue, enhancing readability and ease of navigation. The use of different font styles for headings and body text provides a clear hierarchy, while the sidebar offers easy access to additional resources and options. This design exudes professionalism, making it suitable for educational or informational purposes.<br> Categories: Informational, Educational, Professional, Web Design, User Interface<br> Visual Characteristics: Calming color palette, Structured layout, Clear typography, Sidebar navigation, Minimalist design</code> | <code>Design 215:<br> Description: The CSS Zen Garden design showcases a clean, structured layout aimed at demonstrating the possibilities of CSS styling. It uses a primarily blue and white color palette with red accents to draw attention to headings and separators. The design incorporates a formal serif and a modern sans-serif typography, creating an elegant and readable interface. The use of graphical illustrations adds visual interest and helps convey the collaborative and creative theme. The overall aesthetic balance, combined with functional elements like navigation, ensures a clear and engaging user experience.<br> Categories: Typography, User Interface, Minimalist Design, Educational, Professional, Web Design<br> Visual Characteristics: Blue and White Palette, Elegant Typography, Illustrative Graphics, Clean Layout, Contrasting Accents, Symmetry</code> | <code>0.2857142857142857</code> |
349
+ * Loss: [<code>CosineSimilarityLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosinesimilarityloss) with these parameters:
350
+ ```json
351
+ {
352
+ "loss_fct": "torch.nn.modules.loss.MSELoss"
353
+ }
354
+ ```
355
+
356
+ ### Training Hyperparameters
357
+ #### Non-Default Hyperparameters
358
+
359
+ - `per_device_train_batch_size`: 16
360
+ - `per_device_eval_batch_size`: 16
361
+ - `num_train_epochs`: 1
362
+ - `multi_dataset_batch_sampler`: round_robin
363
+
364
+ #### All Hyperparameters
365
+ <details><summary>Click to expand</summary>
366
+
367
+ - `overwrite_output_dir`: False
368
+ - `do_predict`: False
369
+ - `eval_strategy`: no
370
+ - `prediction_loss_only`: True
371
+ - `per_device_train_batch_size`: 16
372
+ - `per_device_eval_batch_size`: 16
373
+ - `per_gpu_train_batch_size`: None
374
+ - `per_gpu_eval_batch_size`: None
375
+ - `gradient_accumulation_steps`: 1
376
+ - `eval_accumulation_steps`: None
377
+ - `torch_empty_cache_steps`: None
378
+ - `learning_rate`: 5e-05
379
+ - `weight_decay`: 0.0
380
+ - `adam_beta1`: 0.9
381
+ - `adam_beta2`: 0.999
382
+ - `adam_epsilon`: 1e-08
383
+ - `max_grad_norm`: 1
384
+ - `num_train_epochs`: 1
385
+ - `max_steps`: -1
386
+ - `lr_scheduler_type`: linear
387
+ - `lr_scheduler_kwargs`: {}
388
+ - `warmup_ratio`: 0.0
389
+ - `warmup_steps`: 0
390
+ - `log_level`: passive
391
+ - `log_level_replica`: warning
392
+ - `log_on_each_node`: True
393
+ - `logging_nan_inf_filter`: True
394
+ - `save_safetensors`: True
395
+ - `save_on_each_node`: False
396
+ - `save_only_model`: False
397
+ - `restore_callback_states_from_checkpoint`: False
398
+ - `no_cuda`: False
399
+ - `use_cpu`: False
400
+ - `use_mps_device`: False
401
+ - `seed`: 42
402
+ - `data_seed`: None
403
+ - `jit_mode_eval`: False
404
+ - `use_ipex`: False
405
+ - `bf16`: False
406
+ - `fp16`: False
407
+ - `fp16_opt_level`: O1
408
+ - `half_precision_backend`: auto
409
+ - `bf16_full_eval`: False
410
+ - `fp16_full_eval`: False
411
+ - `tf32`: None
412
+ - `local_rank`: 0
413
+ - `ddp_backend`: None
414
+ - `tpu_num_cores`: None
415
+ - `tpu_metrics_debug`: False
416
+ - `debug`: []
417
+ - `dataloader_drop_last`: False
418
+ - `dataloader_num_workers`: 0
419
+ - `dataloader_prefetch_factor`: None
420
+ - `past_index`: -1
421
+ - `disable_tqdm`: False
422
+ - `remove_unused_columns`: True
423
+ - `label_names`: None
424
+ - `load_best_model_at_end`: False
425
+ - `ignore_data_skip`: False
426
+ - `fsdp`: []
427
+ - `fsdp_min_num_params`: 0
428
+ - `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
429
+ - `fsdp_transformer_layer_cls_to_wrap`: None
430
+ - `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
431
+ - `deepspeed`: None
432
+ - `label_smoothing_factor`: 0.0
433
+ - `optim`: adamw_torch
434
+ - `optim_args`: None
435
+ - `adafactor`: False
436
+ - `group_by_length`: False
437
+ - `length_column_name`: length
438
+ - `ddp_find_unused_parameters`: None
439
+ - `ddp_bucket_cap_mb`: None
440
+ - `ddp_broadcast_buffers`: False
441
+ - `dataloader_pin_memory`: True
442
+ - `dataloader_persistent_workers`: False
443
+ - `skip_memory_metrics`: True
444
+ - `use_legacy_prediction_loop`: False
445
+ - `push_to_hub`: False
446
+ - `resume_from_checkpoint`: None
447
+ - `hub_model_id`: None
448
+ - `hub_strategy`: every_save
449
+ - `hub_private_repo`: None
450
+ - `hub_always_push`: False
451
+ - `gradient_checkpointing`: False
452
+ - `gradient_checkpointing_kwargs`: None
453
+ - `include_inputs_for_metrics`: False
454
+ - `include_for_metrics`: []
455
+ - `eval_do_concat_batches`: True
456
+ - `fp16_backend`: auto
457
+ - `push_to_hub_model_id`: None
458
+ - `push_to_hub_organization`: None
459
+ - `mp_parameters`:
460
+ - `auto_find_batch_size`: False
461
+ - `full_determinism`: False
462
+ - `torchdynamo`: None
463
+ - `ray_scope`: last
464
+ - `ddp_timeout`: 1800
465
+ - `torch_compile`: False
466
+ - `torch_compile_backend`: None
467
+ - `torch_compile_mode`: None
468
+ - `dispatch_batches`: None
469
+ - `split_batches`: None
470
+ - `include_tokens_per_second`: False
471
+ - `include_num_input_tokens_seen`: False
472
+ - `neftune_noise_alpha`: None
473
+ - `optim_target_modules`: None
474
+ - `batch_eval_metrics`: False
475
+ - `eval_on_start`: False
476
+ - `use_liger_kernel`: False
477
+ - `eval_use_gather_object`: False
478
+ - `average_tokens_across_devices`: False
479
+ - `prompts`: None
480
+ - `batch_sampler`: batch_sampler
481
+ - `multi_dataset_batch_sampler`: round_robin
482
+
483
+ </details>
484
+
485
+ ### Training Logs
486
+ | Epoch | Step | spearman_cosine |
487
+ |:-----:|:----:|:---------------:|
488
+ | 1.0 | 6 | -0.0686 |
489
+
490
+
491
+ ### Framework Versions
492
+ - Python: 3.11.11
493
+ - Sentence Transformers: 3.4.1
494
+ - Transformers: 4.49.0
495
+ - PyTorch: 2.1.2
496
+ - Accelerate: 1.4.0
497
+ - Datasets: 3.3.2
498
+ - Tokenizers: 0.21.0
499
+
500
+ ## Citation
501
+
502
+ ### BibTeX
503
+
504
+ #### Sentence Transformers
505
+ ```bibtex
506
+ @inproceedings{reimers-2019-sentence-bert,
507
+ title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
508
+ author = "Reimers, Nils and Gurevych, Iryna",
509
+ booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
510
+ month = "11",
511
+ year = "2019",
512
+ publisher = "Association for Computational Linguistics",
513
+ url = "https://arxiv.org/abs/1908.10084",
514
+ }
515
+ ```
516
+
517
+ <!--
518
+ ## Glossary
519
+
520
+ *Clearly define terms in order to be accessible across audiences.*
521
+ -->
522
+
523
+ <!--
524
+ ## Model Card Authors
525
+
526
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
527
+ -->
528
+
529
+ <!--
530
+ ## Model Card Contact
531
+
532
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
533
+ -->
src/fine_tuned_design_embeddings_20250225_161918/config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "sentence-transformers/distilbert-base-nli-stsb-mean-tokens",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertModel"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "initializer_range": 0.02,
12
+ "max_position_embeddings": 512,
13
+ "model_type": "distilbert",
14
+ "n_heads": 12,
15
+ "n_layers": 6,
16
+ "pad_token_id": 0,
17
+ "qa_dropout": 0.1,
18
+ "seq_classif_dropout": 0.2,
19
+ "sinusoidal_pos_embds": false,
20
+ "tie_weights_": true,
21
+ "torch_dtype": "float32",
22
+ "transformers_version": "4.49.0",
23
+ "vocab_size": 30522
24
+ }
src/fine_tuned_design_embeddings_20250225_161918/config_sentence_transformers.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "__version__": {
3
+ "sentence_transformers": "3.4.1",
4
+ "transformers": "4.49.0",
5
+ "pytorch": "2.1.2"
6
+ },
7
+ "prompts": {},
8
+ "default_prompt_name": null,
9
+ "similarity_fn_name": "cosine"
10
+ }
src/fine_tuned_design_embeddings_20250225_161918/eval/similarity_evaluation_results.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ epoch,steps,cosine_pearson,cosine_spearman
2
+ 1.0,6,-0.13960523700017818,-0.06863870136546027
src/fine_tuned_design_embeddings_20250225_161918/modules.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "idx": 0,
4
+ "name": "0",
5
+ "path": "",
6
+ "type": "sentence_transformers.models.Transformer"
7
+ },
8
+ {
9
+ "idx": 1,
10
+ "name": "1",
11
+ "path": "1_Pooling",
12
+ "type": "sentence_transformers.models.Pooling"
13
+ }
14
+ ]
src/fine_tuned_design_embeddings_20250225_161918/sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "max_seq_length": 128,
3
+ "do_lower_case": false
4
+ }
src/fine_tuned_design_embeddings_20250225_161918/special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
+ }
src/fine_tuned_design_embeddings_20250225_161918/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
src/fine_tuned_design_embeddings_20250225_161918/tokenizer_config.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": false,
45
+ "cls_token": "[CLS]",
46
+ "do_basic_tokenize": true,
47
+ "do_lower_case": true,
48
+ "extra_special_tokens": {},
49
+ "full_tokenizer_file": null,
50
+ "mask_token": "[MASK]",
51
+ "model_max_length": 128,
52
+ "never_split": null,
53
+ "pad_token": "[PAD]",
54
+ "sep_token": "[SEP]",
55
+ "strip_accents": null,
56
+ "tokenize_chinese_chars": true,
57
+ "tokenizer_class": "DistilBertTokenizer",
58
+ "unk_token": "[UNK]"
59
+ }
src/fine_tuned_design_embeddings_20250225_161918/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
uv.lock CHANGED
@@ -1,6 +1,24 @@
1
  version = 1
2
  requires-python = "==3.11.*"
3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4
  [[package]]
5
  name = "aiofiles"
6
  version = "23.2.1"
@@ -834,6 +852,7 @@ name = "imagineui"
834
  version = "0.1.0"
835
  source = { editable = "." }
836
  dependencies = [
 
837
  { name = "beautifulsoup4" },
838
  { name = "chainlit" },
839
  { name = "datasets" },
@@ -847,6 +866,7 @@ dependencies = [
847
  { name = "langgraph" },
848
  { name = "langsmith" },
849
  { name = "matplotlib" },
 
850
  { name = "notebook" },
851
  { name = "numpy" },
852
  { name = "openai" },
@@ -865,6 +885,7 @@ dependencies = [
865
 
866
  [package.metadata]
867
  requires-dist = [
 
868
  { name = "beautifulsoup4", specifier = ">=4.12.0" },
869
  { name = "chainlit", specifier = ">=0.7.700" },
870
  { name = "datasets", specifier = ">=2.17.0" },
@@ -878,6 +899,7 @@ requires-dist = [
878
  { name = "langgraph", specifier = ">=0.0.19" },
879
  { name = "langsmith", specifier = ">=0.3.11" },
880
  { name = "matplotlib", specifier = ">=3.10.0" },
 
881
  { name = "notebook" },
882
  { name = "numpy", specifier = ">=1.26.0" },
883
  { name = "openai", specifier = ">=1.63.2,<2.0.0" },
 
1
  version = 1
2
  requires-python = "==3.11.*"
3
 
4
+ [[package]]
5
+ name = "accelerate"
6
+ version = "1.4.0"
7
+ source = { registry = "https://pypi.org/simple" }
8
+ dependencies = [
9
+ { name = "huggingface-hub" },
10
+ { name = "numpy" },
11
+ { name = "packaging" },
12
+ { name = "psutil" },
13
+ { name = "pyyaml" },
14
+ { name = "safetensors" },
15
+ { name = "torch" },
16
+ ]
17
+ sdist = { url = "https://files.pythonhosted.org/packages/8f/02/24a4c4edb9cf0f1e0bc32bb6829e2138f1cc201442e7a24f0daf93b8a15a/accelerate-1.4.0.tar.gz", hash = "sha256:37d413e1b64cb8681ccd2908ae211cf73e13e6e636a2f598a96eccaa538773a5", size = 348745 }
18
+ wheels = [
19
+ { url = "https://files.pythonhosted.org/packages/0a/f6/791b9d7eb371a2f385da3b7f1769ced72ead7bf09744637ea2985c83d7ee/accelerate-1.4.0-py3-none-any.whl", hash = "sha256:f6e1e7dfaf9d799a20a1dc45efbf4b1546163eac133faa5acd0d89177c896e55", size = 342129 },
20
+ ]
21
+
22
  [[package]]
23
  name = "aiofiles"
24
  version = "23.2.1"
 
852
  version = "0.1.0"
853
  source = { editable = "." }
854
  dependencies = [
855
+ { name = "accelerate" },
856
  { name = "beautifulsoup4" },
857
  { name = "chainlit" },
858
  { name = "datasets" },
 
866
  { name = "langgraph" },
867
  { name = "langsmith" },
868
  { name = "matplotlib" },
869
+ { name = "nest-asyncio" },
870
  { name = "notebook" },
871
  { name = "numpy" },
872
  { name = "openai" },
 
885
 
886
  [package.metadata]
887
  requires-dist = [
888
+ { name = "accelerate", specifier = ">=0.26.0" },
889
  { name = "beautifulsoup4", specifier = ">=4.12.0" },
890
  { name = "chainlit", specifier = ">=0.7.700" },
891
  { name = "datasets", specifier = ">=2.17.0" },
 
899
  { name = "langgraph", specifier = ">=0.0.19" },
900
  { name = "langsmith", specifier = ">=0.3.11" },
901
  { name = "matplotlib", specifier = ">=3.10.0" },
902
+ { name = "nest-asyncio", specifier = ">=1.6.0" },
903
  { name = "notebook" },
904
  { name = "numpy", specifier = ">=1.26.0" },
905
  { name = "openai", specifier = ">=1.63.2,<2.0.0" },