Azuremis
/

mlx7-two-tower-retrieval

Model card · Files and versions

Azuremis committed on Apr 25

Commit

cb576c3

·

verified ·

1 Parent(s): 061a3c2

Upload Two-Tower model

Files changed (2) hide show

best_model.pt +3 -0
config.yml +31 -0

best_model.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4bb9033e31ac60f65170f8a07e935b2f36f010b9730638a6f7c51d451f0ebb3b
+size 566119

config.yml ADDED Viewed

	@@ -0,0 +1,31 @@

+batch_size: 256
+checkpoint_dir: checkpoints
+data: data/processed/classic_triplets.parquet
+device: cpu
+embedding:
+  embedding_dim: 64
+  type: lookup
+encoder:
+  arch: mean
+  hidden_dim: 128
+  tied_weights: true
+epochs: 3
+huggingface:
+  private: false
+  push_to_hub: true
+  repo_id: mlx7-two-tower-retrieval
+learning_rate: 1e-3
+loss:
+  margin: 0.2
+  type: triplet
+max_sequence_length: 64
+optimizer:
+  lr: 0.001
+  type: adamw
+tokeniser:
+  max_len: 64
+  type: char
+use_wandb: true
+wandb:
+  entity: azuremis
+  project: two-tower-retrieval