From 48633c714de0b1b9179b1a03e8777c345ea0d5bb Mon Sep 17 00:00:00 2001 From: Alexander Visheratin Date: Fri, 8 Mar 2024 09:42:03 -0500 Subject: [PATCH] Add nllb-siglip-mrl. --- docs/openclip_multilingual_retrieval_results.csv | 2 ++ src/open_clip/pretrained.py | 2 ++ 2 files changed, 4 insertions(+) diff --git a/docs/openclip_multilingual_retrieval_results.csv b/docs/openclip_multilingual_retrieval_results.csv index 5055d045b..1bf4afede 100644 --- a/docs/openclip_multilingual_retrieval_results.csv +++ b/docs/openclip_multilingual_retrieval_results.csv @@ -1,4 +1,6 @@ model,version,avg,crossmodal3600 image_retrieval_recall@1 avg,crossmodal3600 image_retrieval_recall@1 ar,crossmodal3600 image_retrieval_recall@1 bn,crossmodal3600 image_retrieval_recall@1 cs,crossmodal3600 image_retrieval_recall@1 da,crossmodal3600 image_retrieval_recall@1 de,crossmodal3600 image_retrieval_recall@1 el,crossmodal3600 image_retrieval_recall@1 en,crossmodal3600 image_retrieval_recall@1 es,crossmodal3600 image_retrieval_recall@1 fa,crossmodal3600 image_retrieval_recall@1 fi,crossmodal3600 image_retrieval_recall@1 fil,crossmodal3600 image_retrieval_recall@1 fr,crossmodal3600 image_retrieval_recall@1 he,crossmodal3600 image_retrieval_recall@1 hi,crossmodal3600 image_retrieval_recall@1 hr,crossmodal3600 image_retrieval_recall@1 hu,crossmodal3600 image_retrieval_recall@1 id,crossmodal3600 image_retrieval_recall@1 it,crossmodal3600 image_retrieval_recall@1 ja,crossmodal3600 image_retrieval_recall@1 ko,crossmodal3600 image_retrieval_recall@1 mi,crossmodal3600 image_retrieval_recall@1 nl,crossmodal3600 image_retrieval_recall@1 no,crossmodal3600 image_retrieval_recall@1 pl,crossmodal3600 image_retrieval_recall@1 pt,crossmodal3600 image_retrieval_recall@1 quz,crossmodal3600 image_retrieval_recall@1 ro,crossmodal3600 image_retrieval_recall@1 ru,crossmodal3600 image_retrieval_recall@1 sv,crossmodal3600 image_retrieval_recall@1 sw,crossmodal3600 image_retrieval_recall@1 te,crossmodal3600 image_retrieval_recall@1 th,crossmodal3600 image_retrieval_recall@1 tr,crossmodal3600 image_retrieval_recall@1 uk,crossmodal3600 image_retrieval_recall@1 vi,crossmodal3600 image_retrieval_recall@1 zh,crossmodal3600 image_retrieval_recall@10 avg,crossmodal3600 image_retrieval_recall@10 ar,crossmodal3600 image_retrieval_recall@10 bn,crossmodal3600 image_retrieval_recall@10 cs,crossmodal3600 image_retrieval_recall@10 da,crossmodal3600 image_retrieval_recall@10 de,crossmodal3600 image_retrieval_recall@10 el,crossmodal3600 image_retrieval_recall@10 en,crossmodal3600 image_retrieval_recall@10 es,crossmodal3600 image_retrieval_recall@10 fa,crossmodal3600 image_retrieval_recall@10 fi,crossmodal3600 image_retrieval_recall@10 fil,crossmodal3600 image_retrieval_recall@10 fr,crossmodal3600 image_retrieval_recall@10 he,crossmodal3600 image_retrieval_recall@10 hi,crossmodal3600 image_retrieval_recall@10 hr,crossmodal3600 image_retrieval_recall@10 hu,crossmodal3600 image_retrieval_recall@10 id,crossmodal3600 image_retrieval_recall@10 it,crossmodal3600 image_retrieval_recall@10 ja,crossmodal3600 image_retrieval_recall@10 ko,crossmodal3600 image_retrieval_recall@10 mi,crossmodal3600 image_retrieval_recall@10 nl,crossmodal3600 image_retrieval_recall@10 no,crossmodal3600 image_retrieval_recall@10 pl,crossmodal3600 image_retrieval_recall@10 pt,crossmodal3600 image_retrieval_recall@10 quz,crossmodal3600 image_retrieval_recall@10 ro,crossmodal3600 image_retrieval_recall@10 ru,crossmodal3600 image_retrieval_recall@10 sv,crossmodal3600 image_retrieval_recall@10 sw,crossmodal3600 image_retrieval_recall@10 te,crossmodal3600 image_retrieval_recall@10 th,crossmodal3600 image_retrieval_recall@10 tr,crossmodal3600 image_retrieval_recall@10 uk,crossmodal3600 image_retrieval_recall@10 vi,crossmodal3600 image_retrieval_recall@10 zh,crossmodal3600 image_retrieval_recall@5 avg,crossmodal3600 image_retrieval_recall@5 ar,crossmodal3600 image_retrieval_recall@5 bn,crossmodal3600 image_retrieval_recall@5 cs,crossmodal3600 image_retrieval_recall@5 da,crossmodal3600 image_retrieval_recall@5 de,crossmodal3600 image_retrieval_recall@5 el,crossmodal3600 image_retrieval_recall@5 en,crossmodal3600 image_retrieval_recall@5 es,crossmodal3600 image_retrieval_recall@5 fa,crossmodal3600 image_retrieval_recall@5 fi,crossmodal3600 image_retrieval_recall@5 fil,crossmodal3600 image_retrieval_recall@5 fr,crossmodal3600 image_retrieval_recall@5 he,crossmodal3600 image_retrieval_recall@5 hi,crossmodal3600 image_retrieval_recall@5 hr,crossmodal3600 image_retrieval_recall@5 hu,crossmodal3600 image_retrieval_recall@5 id,crossmodal3600 image_retrieval_recall@5 it,crossmodal3600 image_retrieval_recall@5 ja,crossmodal3600 image_retrieval_recall@5 ko,crossmodal3600 image_retrieval_recall@5 mi,crossmodal3600 image_retrieval_recall@5 nl,crossmodal3600 image_retrieval_recall@5 no,crossmodal3600 image_retrieval_recall@5 pl,crossmodal3600 image_retrieval_recall@5 pt,crossmodal3600 image_retrieval_recall@5 quz,crossmodal3600 image_retrieval_recall@5 ro,crossmodal3600 image_retrieval_recall@5 ru,crossmodal3600 image_retrieval_recall@5 sv,crossmodal3600 image_retrieval_recall@5 sw,crossmodal3600 image_retrieval_recall@5 te,crossmodal3600 image_retrieval_recall@5 th,crossmodal3600 image_retrieval_recall@5 tr,crossmodal3600 image_retrieval_recall@5 uk,crossmodal3600 image_retrieval_recall@5 vi,crossmodal3600 image_retrieval_recall@5 zh,crossmodal3600 text_retrieval_recall@1 avg,crossmodal3600 text_retrieval_recall@1 ar,crossmodal3600 text_retrieval_recall@1 bn,crossmodal3600 text_retrieval_recall@1 cs,crossmodal3600 text_retrieval_recall@1 da,crossmodal3600 text_retrieval_recall@1 de,crossmodal3600 text_retrieval_recall@1 el,crossmodal3600 text_retrieval_recall@1 en,crossmodal3600 text_retrieval_recall@1 es,crossmodal3600 text_retrieval_recall@1 fa,crossmodal3600 text_retrieval_recall@1 fi,crossmodal3600 text_retrieval_recall@1 fil,crossmodal3600 text_retrieval_recall@1 fr,crossmodal3600 text_retrieval_recall@1 he,crossmodal3600 text_retrieval_recall@1 hi,crossmodal3600 text_retrieval_recall@1 hr,crossmodal3600 text_retrieval_recall@1 hu,crossmodal3600 text_retrieval_recall@1 id,crossmodal3600 text_retrieval_recall@1 it,crossmodal3600 text_retrieval_recall@1 ja,crossmodal3600 text_retrieval_recall@1 ko,crossmodal3600 text_retrieval_recall@1 mi,crossmodal3600 text_retrieval_recall@1 nl,crossmodal3600 text_retrieval_recall@1 no,crossmodal3600 text_retrieval_recall@1 pl,crossmodal3600 text_retrieval_recall@1 pt,crossmodal3600 text_retrieval_recall@1 quz,crossmodal3600 text_retrieval_recall@1 ro,crossmodal3600 text_retrieval_recall@1 ru,crossmodal3600 text_retrieval_recall@1 sv,crossmodal3600 text_retrieval_recall@1 sw,crossmodal3600 text_retrieval_recall@1 te,crossmodal3600 text_retrieval_recall@1 th,crossmodal3600 text_retrieval_recall@1 tr,crossmodal3600 text_retrieval_recall@1 uk,crossmodal3600 text_retrieval_recall@1 vi,crossmodal3600 text_retrieval_recall@1 zh,crossmodal3600 text_retrieval_recall@10 avg,crossmodal3600 text_retrieval_recall@10 ar,crossmodal3600 text_retrieval_recall@10 bn,crossmodal3600 text_retrieval_recall@10 cs,crossmodal3600 text_retrieval_recall@10 da,crossmodal3600 text_retrieval_recall@10 de,crossmodal3600 text_retrieval_recall@10 el,crossmodal3600 text_retrieval_recall@10 en,crossmodal3600 text_retrieval_recall@10 es,crossmodal3600 text_retrieval_recall@10 fa,crossmodal3600 text_retrieval_recall@10 fi,crossmodal3600 text_retrieval_recall@10 fil,crossmodal3600 text_retrieval_recall@10 fr,crossmodal3600 text_retrieval_recall@10 he,crossmodal3600 text_retrieval_recall@10 hi,crossmodal3600 text_retrieval_recall@10 hr,crossmodal3600 text_retrieval_recall@10 hu,crossmodal3600 text_retrieval_recall@10 id,crossmodal3600 text_retrieval_recall@10 it,crossmodal3600 text_retrieval_recall@10 ja,crossmodal3600 text_retrieval_recall@10 ko,crossmodal3600 text_retrieval_recall@10 mi,crossmodal3600 text_retrieval_recall@10 nl,crossmodal3600 text_retrieval_recall@10 no,crossmodal3600 text_retrieval_recall@10 pl,crossmodal3600 text_retrieval_recall@10 pt,crossmodal3600 text_retrieval_recall@10 quz,crossmodal3600 text_retrieval_recall@10 ro,crossmodal3600 text_retrieval_recall@10 ru,crossmodal3600 text_retrieval_recall@10 sv,crossmodal3600 text_retrieval_recall@10 sw,crossmodal3600 text_retrieval_recall@10 te,crossmodal3600 text_retrieval_recall@10 th,crossmodal3600 text_retrieval_recall@10 tr,crossmodal3600 text_retrieval_recall@10 uk,crossmodal3600 text_retrieval_recall@10 vi,crossmodal3600 text_retrieval_recall@10 zh,crossmodal3600 text_retrieval_recall@5 avg,crossmodal3600 text_retrieval_recall@5 ar,crossmodal3600 text_retrieval_recall@5 bn,crossmodal3600 text_retrieval_recall@5 cs,crossmodal3600 text_retrieval_recall@5 da,crossmodal3600 text_retrieval_recall@5 de,crossmodal3600 text_retrieval_recall@5 el,crossmodal3600 text_retrieval_recall@5 en,crossmodal3600 text_retrieval_recall@5 es,crossmodal3600 text_retrieval_recall@5 fa,crossmodal3600 text_retrieval_recall@5 fi,crossmodal3600 text_retrieval_recall@5 fil,crossmodal3600 text_retrieval_recall@5 fr,crossmodal3600 text_retrieval_recall@5 he,crossmodal3600 text_retrieval_recall@5 hi,crossmodal3600 text_retrieval_recall@5 hr,crossmodal3600 text_retrieval_recall@5 hu,crossmodal3600 text_retrieval_recall@5 id,crossmodal3600 text_retrieval_recall@5 it,crossmodal3600 text_retrieval_recall@5 ja,crossmodal3600 text_retrieval_recall@5 ko,crossmodal3600 text_retrieval_recall@5 mi,crossmodal3600 text_retrieval_recall@5 nl,crossmodal3600 text_retrieval_recall@5 no,crossmodal3600 text_retrieval_recall@5 pl,crossmodal3600 text_retrieval_recall@5 pt,crossmodal3600 text_retrieval_recall@5 quz,crossmodal3600 text_retrieval_recall@5 ro,crossmodal3600 text_retrieval_recall@5 ru,crossmodal3600 text_retrieval_recall@5 sv,crossmodal3600 text_retrieval_recall@5 sw,crossmodal3600 text_retrieval_recall@5 te,crossmodal3600 text_retrieval_recall@5 th,crossmodal3600 text_retrieval_recall@5 tr,crossmodal3600 text_retrieval_recall@5 uk,crossmodal3600 text_retrieval_recall@5 vi,crossmodal3600 text_retrieval_recall@5 zh,multilingual_mscoco_captions image_retrieval_recall@1 avg,multilingual_mscoco_captions image_retrieval_recall@1 de,multilingual_mscoco_captions image_retrieval_recall@1 en,multilingual_mscoco_captions image_retrieval_recall@1 es,multilingual_mscoco_captions image_retrieval_recall@1 fr,multilingual_mscoco_captions image_retrieval_recall@1 it,multilingual_mscoco_captions image_retrieval_recall@1 jp,multilingual_mscoco_captions image_retrieval_recall@1 ko,multilingual_mscoco_captions image_retrieval_recall@1 pl,multilingual_mscoco_captions image_retrieval_recall@1 ru,multilingual_mscoco_captions image_retrieval_recall@1 tr,multilingual_mscoco_captions image_retrieval_recall@1 zh,multilingual_mscoco_captions image_retrieval_recall@10 avg,multilingual_mscoco_captions image_retrieval_recall@10 de,multilingual_mscoco_captions image_retrieval_recall@10 en,multilingual_mscoco_captions image_retrieval_recall@10 es,multilingual_mscoco_captions image_retrieval_recall@10 fr,multilingual_mscoco_captions image_retrieval_recall@10 it,multilingual_mscoco_captions image_retrieval_recall@10 jp,multilingual_mscoco_captions image_retrieval_recall@10 ko,multilingual_mscoco_captions image_retrieval_recall@10 pl,multilingual_mscoco_captions image_retrieval_recall@10 ru,multilingual_mscoco_captions image_retrieval_recall@10 tr,multilingual_mscoco_captions image_retrieval_recall@10 zh,multilingual_mscoco_captions image_retrieval_recall@5 avg,multilingual_mscoco_captions image_retrieval_recall@5 de,multilingual_mscoco_captions image_retrieval_recall@5 en,multilingual_mscoco_captions image_retrieval_recall@5 es,multilingual_mscoco_captions image_retrieval_recall@5 fr,multilingual_mscoco_captions image_retrieval_recall@5 it,multilingual_mscoco_captions image_retrieval_recall@5 jp,multilingual_mscoco_captions image_retrieval_recall@5 ko,multilingual_mscoco_captions image_retrieval_recall@5 pl,multilingual_mscoco_captions image_retrieval_recall@5 ru,multilingual_mscoco_captions image_retrieval_recall@5 tr,multilingual_mscoco_captions image_retrieval_recall@5 zh,multilingual_mscoco_captions text_retrieval_recall@1 avg,multilingual_mscoco_captions text_retrieval_recall@1 de,multilingual_mscoco_captions text_retrieval_recall@1 en,multilingual_mscoco_captions text_retrieval_recall@1 es,multilingual_mscoco_captions text_retrieval_recall@1 fr,multilingual_mscoco_captions text_retrieval_recall@1 it,multilingual_mscoco_captions text_retrieval_recall@1 jp,multilingual_mscoco_captions text_retrieval_recall@1 ko,multilingual_mscoco_captions text_retrieval_recall@1 pl,multilingual_mscoco_captions text_retrieval_recall@1 ru,multilingual_mscoco_captions text_retrieval_recall@1 tr,multilingual_mscoco_captions text_retrieval_recall@1 zh,multilingual_mscoco_captions text_retrieval_recall@10 avg,multilingual_mscoco_captions text_retrieval_recall@10 de,multilingual_mscoco_captions text_retrieval_recall@10 en,multilingual_mscoco_captions text_retrieval_recall@10 es,multilingual_mscoco_captions text_retrieval_recall@10 fr,multilingual_mscoco_captions text_retrieval_recall@10 it,multilingual_mscoco_captions text_retrieval_recall@10 jp,multilingual_mscoco_captions text_retrieval_recall@10 ko,multilingual_mscoco_captions text_retrieval_recall@10 pl,multilingual_mscoco_captions text_retrieval_recall@10 ru,multilingual_mscoco_captions text_retrieval_recall@10 tr,multilingual_mscoco_captions text_retrieval_recall@10 zh,multilingual_mscoco_captions text_retrieval_recall@5 avg,multilingual_mscoco_captions text_retrieval_recall@5 de,multilingual_mscoco_captions text_retrieval_recall@5 en,multilingual_mscoco_captions text_retrieval_recall@5 es,multilingual_mscoco_captions text_retrieval_recall@5 fr,multilingual_mscoco_captions text_retrieval_recall@5 it,multilingual_mscoco_captions text_retrieval_recall@5 jp,multilingual_mscoco_captions text_retrieval_recall@5 ko,multilingual_mscoco_captions text_retrieval_recall@5 pl,multilingual_mscoco_captions text_retrieval_recall@5 ru,multilingual_mscoco_captions text_retrieval_recall@5 tr,multilingual_mscoco_captions text_retrieval_recall@5 zh +nllb-clip-large-siglip,mrl,0.784,0.6079,0.5836,0.5728,0.5289,0.7269,0.7569,0.5653,0.5211,0.6386,0.6131,0.6867,0.4719,0.7153,0.7322,0.42,0.7419,0.7078,0.6958,0.7019,0.7003,0.5942,0.2919,0.6133,0.6525,0.635,0.6208,0.2239,0.7575,0.6886,0.5919,0.4975,0.4233,0.6233,0.6442,0.6797,0.6725,0.595,0.8922,0.9047,0.8842,0.8817,0.9608,0.9681,0.8725,0.8622,0.9269,0.9144,0.9436,0.8167,0.9564,0.9572,0.7692,0.9586,0.95,0.9494,0.9514,0.9414,0.8911,0.6289,0.9147,0.9186,0.9097,0.9197,0.5003,0.9694,0.9483,0.8953,0.8344,0.8019,0.9208,0.9236,0.9408,0.9433,0.89,0.8333,0.8308,0.8172,0.8017,0.9183,0.9306,0.7997,0.7878,0.8758,0.8578,0.8978,0.7378,0.9167,0.9239,0.6717,0.9242,0.9097,0.9058,0.9072,0.8997,0.8306,0.5317,0.8544,0.87,0.8547,0.8592,0.4183,0.9381,0.9047,0.8267,0.7533,0.7042,0.8558,0.8672,0.8958,0.8956,0.825,0.5741,0.5447,0.5608,0.4931,0.6961,0.7119,0.5253,0.4969,0.5992,0.5722,0.6494,0.4394,0.6803,0.7053,0.4311,0.7014,0.6753,0.6611,0.6517,0.6714,0.5589,0.2733,0.5675,0.6108,0.5856,0.5742,0.2267,0.7183,0.6453,0.5528,0.4708,0.395,0.5869,0.5989,0.6544,0.6286,0.5544,0.8816,0.8828,0.8847,0.8647,0.9464,0.9561,0.8506,0.855,0.9167,0.8978,0.9356,0.7925,0.9478,0.955,0.7864,0.955,0.9422,0.9431,0.9442,0.9356,0.8806,0.6189,0.8981,0.9167,0.8981,0.8967,0.4878,0.9703,0.9347,0.8783,0.8206,0.7856,0.9039,0.9139,0.9344,0.9342,0.8728,0.8174,0.8078,0.8186,0.7778,0.9025,0.9136,0.7783,0.7731,0.8531,0.8242,0.8822,0.7033,0.9011,0.9103,0.6925,0.9156,0.8944,0.8919,0.8917,0.8908,0.8125,0.5094,0.8317,0.8583,0.8397,0.8342,0.4033,0.9336,0.8881,0.8069,0.7364,0.6814,0.8383,0.8506,0.8847,0.8831,0.8097,0.6997,0.717,0.748,0.721,0.72,0.71,0.604,0.667,0.737,0.667,0.717,0.689,0.9503,0.952,0.968,0.958,0.948,0.964,0.905,0.954,0.962,0.931,0.964,0.947,0.8988,0.903,0.928,0.905,0.907,0.913,0.844,0.895,0.911,0.86,0.919,0.902,0.6433,0.661,0.696,0.659,0.661,0.661,0.554,0.611,0.686,0.609,0.645,0.633,0.9449,0.951,0.972,0.964,0.94,0.962,0.885,0.937,0.961,0.911,0.963,0.948,0.8848,0.894,0.919,0.902,0.896,0.903,0.807,0.868,0.906,0.841,0.907,0.89 +nllb-clip-base-siglip,mrl,0.7493,0.5539,0.5358,0.5439,0.4783,0.6817,0.6933,0.4894,0.4914,0.5833,0.5572,0.6192,0.4056,0.6667,0.68,0.3842,0.6647,0.6306,0.6489,0.6411,0.6461,0.5411,0.2436,0.5767,0.5894,0.5761,0.5583,0.1864,0.6819,0.6331,0.5375,0.4517,0.3839,0.5658,0.5964,0.6264,0.6147,0.5353,0.8643,0.8819,0.8733,0.8533,0.9439,0.9439,0.8331,0.8392,0.9025,0.8858,0.9128,0.76,0.9333,0.9417,0.7389,0.9389,0.9139,0.9292,0.9314,0.9228,0.8614,0.5658,0.8853,0.8994,0.8739,0.8839,0.4497,0.9511,0.9192,0.8725,0.8097,0.7753,0.8936,0.9011,0.915,0.9181,0.8589,0.7963,0.8033,0.7956,0.7633,0.8992,0.9011,0.7517,0.7589,0.8306,0.8178,0.8497,0.6708,0.8878,0.8933,0.6372,0.8856,0.8658,0.8803,0.8683,0.8703,0.7933,0.4744,0.8167,0.8408,0.81,0.8167,0.3653,0.9017,0.8608,0.7925,0.7211,0.6622,0.8239,0.8453,0.8583,0.8606,0.7922,0.5232,0.4983,0.5306,0.4467,0.6419,0.66,0.4658,0.47,0.5575,0.5158,0.5797,0.3883,0.6361,0.6328,0.3931,0.6294,0.5844,0.6142,0.5964,0.6103,0.5111,0.2353,0.5297,0.5581,0.5258,0.5222,0.1917,0.6444,0.5939,0.4997,0.4267,0.3658,0.5508,0.5653,0.5928,0.5783,0.4939,0.8558,0.8625,0.8756,0.8389,0.9361,0.9378,0.815,0.8314,0.8956,0.8647,0.9031,0.7522,0.9356,0.9336,0.76,0.9319,0.9061,0.9197,0.9242,0.9233,0.86,0.5511,0.8772,0.8914,0.8672,0.8697,0.4436,0.9483,0.9111,0.8531,0.7936,0.7589,0.8856,0.8906,0.9033,0.9119,0.8444,0.7792,0.7781,0.8014,0.7383,0.8872,0.885,0.7314,0.7439,0.8186,0.7839,0.8381,0.6489,0.8758,0.8803,0.6686,0.8739,0.8414,0.8583,0.8539,0.8553,0.7764,0.4567,0.8003,0.8233,0.7947,0.7933,0.3542,0.8953,0.8417,0.7608,0.6892,0.6411,0.8119,0.8197,0.8422,0.84,0.7494,0.6559,0.676,0.719,0.68,0.689,0.677,0.565,0.624,0.677,0.613,0.668,0.627,0.9458,0.95,0.966,0.96,0.955,0.962,0.894,0.94,0.96,0.909,0.963,0.945,0.8846,0.901,0.92,0.899,0.896,0.898,0.814,0.867,0.904,0.85,0.901,0.881,0.6106,0.625,0.668,0.629,0.631,0.63,0.513,0.587,0.636,0.588,0.616,0.594,0.9379,0.939,0.963,0.955,0.942,0.955,0.881,0.924,0.953,0.91,0.957,0.938,0.8643,0.871,0.904,0.881,0.875,0.893,0.798,0.843,0.882,0.827,0.886,0.847 nllb-clip-large-siglip,v1,0.7391,0.5456,0.5203,0.4908,0.4636,0.6558,0.6869,0.5128,0.4583,0.5789,0.5356,0.6192,0.4303,0.6483,0.6564,0.3511,0.6639,0.6458,0.6375,0.6183,0.6261,0.5442,0.26,0.5642,0.5767,0.5961,0.5767,0.1919,0.6881,0.6272,0.5442,0.4317,0.3733,0.5569,0.5767,0.6158,0.5967,0.5206,0.8605,0.8647,0.825,0.8436,0.9303,0.9397,0.8556,0.8194,0.8961,0.8775,0.9172,0.7878,0.9331,0.9311,0.7019,0.9378,0.9275,0.9186,0.9161,0.9144,0.8631,0.5908,0.8939,0.8967,0.8894,0.8978,0.4731,0.9442,0.9256,0.8719,0.7939,0.745,0.8811,0.9011,0.9133,0.9139,0.8444,0.7913,0.7892,0.7519,0.7567,0.8714,0.8956,0.7783,0.7311,0.8264,0.8039,0.8642,0.6986,0.8786,0.8786,0.6031,0.8869,0.8789,0.8631,0.8594,0.8606,0.7875,0.4897,0.8169,0.8269,0.8272,0.8269,0.3903,0.9003,0.8644,0.7933,0.7094,0.6542,0.8114,0.8347,0.8544,0.8556,0.7656,0.5053,0.4789,0.4878,0.4311,0.6169,0.6364,0.4772,0.4353,0.5381,0.4925,0.5697,0.3828,0.615,0.6064,0.36,0.6206,0.5869,0.5975,0.5647,0.5753,0.4922,0.2322,0.5164,0.5428,0.5406,0.5236,0.1853,0.6283,0.5875,0.4906,0.3903,0.3367,0.5144,0.5464,0.5697,0.5506,0.4711,0.8457,0.8392,0.8306,0.8253,0.9236,0.9278,0.8222,0.8119,0.8822,0.8533,0.9111,0.7567,0.9281,0.9161,0.7125,0.9269,0.9142,0.9114,0.9014,0.8978,0.8514,0.5689,0.8714,0.8856,0.8739,0.8747,0.4494,0.9411,0.9086,0.8494,0.7764,0.7203,0.8733,0.8794,0.9017,0.9031,0.8236,0.7691,0.7586,0.7558,0.7297,0.8653,0.875,0.7481,0.7081,0.8119,0.7639,0.8425,0.6594,0.8664,0.8567,0.6189,0.8692,0.8528,0.8433,0.835,0.8403,0.7675,0.4608,0.7928,0.8208,0.7958,0.7939,0.3633,0.8883,0.8464,0.7658,0.6769,0.6125,0.7956,0.8036,0.8322,0.8314,0.7383,0.6499,0.667,0.699,0.665,0.661,0.674,0.571,0.633,0.679,0.606,0.672,0.622,0.9395,0.942,0.965,0.946,0.94,0.956,0.884,0.936,0.953,0.915,0.952,0.945,0.8699,0.883,0.894,0.882,0.877,0.893,0.809,0.852,0.894,0.834,0.883,0.868,0.5847,0.589,0.628,0.605,0.604,0.599,0.506,0.537,0.615,0.57,0.607,0.572,0.9266,0.931,0.958,0.939,0.921,0.952,0.867,0.918,0.945,0.892,0.938,0.932,0.8472,0.844,0.883,0.858,0.863,0.867,0.782,0.832,0.868,0.809,0.871,0.842 nllb-clip-base-siglip,v1,0.7103,0.5067,0.5022,0.4844,0.4311,0.6344,0.6442,0.4508,0.4489,0.5383,0.5061,0.5625,0.37,0.61,0.6144,0.3258,0.6247,0.5831,0.5981,0.5775,0.595,0.5028,0.2183,0.5194,0.5297,0.5397,0.5133,0.1642,0.6203,0.59,0.5006,0.4028,0.3425,0.5278,0.5483,0.5658,0.5669,0.4883,0.8353,0.8556,0.8264,0.8122,0.9217,0.9236,0.8108,0.8078,0.8728,0.8478,0.8844,0.7339,0.9144,0.9033,0.6858,0.915,0.8892,0.9047,0.9008,0.8925,0.8397,0.5386,0.8683,0.8672,0.8528,0.8703,0.4283,0.9178,0.9025,0.8419,0.7706,0.7286,0.8583,0.8844,0.8819,0.8919,0.8239,0.7598,0.7694,0.7419,0.7181,0.8664,0.8725,0.7197,0.7222,0.7997,0.7669,0.8144,0.6481,0.8558,0.8394,0.5808,0.8625,0.8278,0.8417,0.8267,0.8314,0.7547,0.435,0.7886,0.7997,0.7861,0.7944,0.3458,0.8617,0.8378,0.7617,0.6711,0.6214,0.7883,0.81,0.8189,0.8256,0.7464,0.467,0.4492,0.4606,0.3964,0.5956,0.6,0.4239,0.4153,0.4931,0.4575,0.5103,0.3531,0.5711,0.5472,0.3369,0.5739,0.5264,0.5539,0.5189,0.5481,0.4736,0.1956,0.4756,0.4947,0.4831,0.4831,0.1622,0.5572,0.5353,0.4583,0.3814,0.3203,0.4844,0.5031,0.5203,0.5211,0.4311,0.8171,0.8281,0.8317,0.7933,0.9117,0.9106,0.7808,0.7864,0.8547,0.8194,0.8597,0.7133,0.8997,0.8864,0.7056,0.9056,0.8775,0.8892,0.8797,0.8875,0.8275,0.5083,0.8361,0.8603,0.8336,0.8397,0.4131,0.9036,0.8794,0.8194,0.745,0.6914,0.8469,0.8589,0.8592,0.8806,0.7931,0.7317,0.7369,0.7361,0.6833,0.8469,0.8444,0.6889,0.6908,0.77,0.7286,0.7875,0.6119,0.8364,0.8114,0.5983,0.845,0.8011,0.8189,0.7864,0.8114,0.7417,0.4056,0.7433,0.7703,0.7539,0.7489,0.3325,0.8358,0.8061,0.7231,0.6406,0.5758,0.7628,0.7769,0.7867,0.8003,0.7022,0.6258,0.629,0.684,0.652,0.648,0.643,0.546,0.6,0.654,0.607,0.637,0.584,0.9275,0.935,0.952,0.939,0.935,0.944,0.878,0.922,0.944,0.886,0.943,0.924,0.8574,0.87,0.888,0.867,0.869,0.878,0.808,0.836,0.876,0.824,0.868,0.847,0.5701,0.588,0.624,0.574,0.582,0.591,0.494,0.548,0.58,0.553,0.59,0.547,0.9135,0.916,0.939,0.936,0.92,0.936,0.846,0.899,0.926,0.883,0.931,0.917,0.8384,0.843,0.875,0.852,0.844,0.856,0.766,0.826,0.866,0.812,0.854,0.828 xlm-roberta-large-ViT-H-14,frozen_laion5b_s13b_b90k,0.7062,0.5022,0.4606,0.0542,0.4608,0.6678,0.7328,0.5222,0.5133,0.6219,0.5639,0.5711,0.0997,0.6853,0.6406,0.215,0.6547,0.6494,0.6431,0.6642,0.7261,0.5156,0.0044,0.5606,0.5561,0.6308,0.615,0.0361,0.7008,0.7022,0.5394,0.0267,0.0064,0.5433,0.5881,0.6703,0.6475,0.5906,0.7599,0.8122,0.1856,0.8228,0.9358,0.9594,0.8442,0.8514,0.9203,0.8783,0.88,0.2417,0.9444,0.9181,0.5228,0.9275,0.9272,0.9192,0.9364,0.96,0.8511,0.0183,0.8875,0.8883,0.9094,0.9103,0.1106,0.9494,0.9511,0.8589,0.0683,0.0283,0.8769,0.8997,0.9378,0.9303,0.8933,0.7049,0.7225,0.1297,0.7406,0.8953,0.9242,0.7728,0.7783,0.8633,0.8047,0.8142,0.1958,0.9047,0.8642,0.4183,0.8758,0.8758,0.8658,0.8892,0.9225,0.7681,0.0139,0.8208,0.8183,0.8533,0.8483,0.0842,0.9114,0.9128,0.7867,0.0567,0.0175,0.8011,0.8292,0.8878,0.8783,0.8317,0.5338,0.4867,0.1206,0.4989,0.7306,0.7694,0.5608,0.5267,0.62,0.6028,0.6206,0.1344,0.71,0.6822,0.2783,0.7061,0.6658,0.6756,0.6936,0.7556,0.5611,0.0097,0.5533,0.6272,0.645,0.6147,0.0542,0.7436,0.6994,0.5864,0.0442,0.0144,0.5867,0.5992,0.7078,0.6986,0.6322,0.7891,0.8478,0.3214,0.87,0.9611,0.975,0.8808,0.8697,0.9294,0.9056,0.9175,0.2861,0.9617,0.9372,0.6089,0.9492,0.9447,0.9428,0.9542,0.9719,0.8875,0.0261,0.8894,0.9219,0.9306,0.92,0.1517,0.9714,0.9564,0.8947,0.0953,0.0625,0.9094,0.9189,0.9594,0.9572,0.9206,0.7372,0.7622,0.2508,0.7811,0.9233,0.9483,0.8117,0.7892,0.87,0.8417,0.8544,0.2436,0.9172,0.8878,0.5169,0.9139,0.8872,0.895,0.9114,0.9444,0.8136,0.0211,0.8158,0.8692,0.8778,0.8625,0.1214,0.9394,0.915,0.8347,0.0767,0.0411,0.8458,0.8553,0.9161,0.9172,0.8669,0.6456,0.648,0.736,0.659,0.646,0.649,0.643,0.565,0.686,0.624,0.627,0.619,0.9324,0.935,0.951,0.947,0.927,0.948,0.923,0.903,0.948,0.916,0.924,0.934,0.8714,0.874,0.908,0.891,0.867,0.879,0.862,0.832,0.895,0.854,0.866,0.857,0.6445,0.655,0.715,0.682,0.643,0.664,0.623,0.528,0.68,0.627,0.635,0.637,0.9482,0.952,0.973,0.96,0.945,0.96,0.94,0.902,0.964,0.939,0.948,0.947,0.8835,0.896,0.924,0.899,0.885,0.897,0.871,0.813,0.913,0.859,0.878,0.884 diff --git a/src/open_clip/pretrained.py b/src/open_clip/pretrained.py index e7cd74fe1..e43e773fd 100644 --- a/src/open_clip/pretrained.py +++ b/src/open_clip/pretrained.py @@ -433,9 +433,11 @@ def _apcfg(url='', hf_hub='', **kwargs): "nllb-clip-base-siglip": dict( v1=_slpcfg(hf_hub='visheratin/nllb-clip-base-siglip/'), + mrl=_slpcfg(hf_hub='visheratin/nllb-siglip-mrl-base/'), ), "nllb-clip-large-siglip": dict( v1=_slpcfg(hf_hub='visheratin/nllb-clip-large-siglip/'), + mrl=_slpcfg(hf_hub='visheratin/nllb-siglip-mrl-large/'), ) }