| 01 | | image-text-to-text | 1.7M | 860 | | 14d |
| 02 | | image-text-to-text | 745K | 164 | | 9d |
| 03 | | image-text-to-text | 702K | 495 | | 8d |
| 04 | | image-text-to-text | 579K | 500 | | 13d |
| 05 | | — | 563K | 110 | | 13d |
| 06 | | image-text-to-text | 509K | 998 | | 9d |
| 07 | | image-text-to-text | 3.2M | 626 | | 28d |
| 08 | | image-text-to-text | 1.8M | 350 | | 28d |
| 09 | | image-text-to-text | 6.6M | 2.4K | | 49d |
| 10 | | image-text-to-text | 5.1M | 847 | | 49d |
| 11 | | image-text-to-text | 1.5M | 1.5K | | 15d |
| 12 | | image-text-to-text | 215K | 232 | | 7d |
| 13 | | image-text-to-text | 1.5M | 191 | | 15d |
| 14 | | image-text-to-text | 196K | 39 | | 7d |
| 15 | | any-to-any | 4.0M | 864 | | 58d |
| 16 | | text-generation | 174K | 3.2K | | 8d |
| 17 | | text-generation | 141K | 207 | | 11d |
| 18 | | — | 132K | 95 | | 13d |
| 19 | | any-to-any | 2.7M | 547 | | 58d |
| 20 | | image-text-to-text | 119K | 56 | | 7d |
| 21 | | image-to-text | 8.0M | 1.7K | | 90d |
| 22 | | image-text-to-text | 7.1M | 1.4K | | 62d |
| 23 | | image-text-to-text | 33K | 47 | | 6d |
| 24 | | text-generation | 97K | 852 | | 8d |
| 25 | | text-generation | 91K | 91 | | 11d |
| 26 | | text-generation | 80K | 232 | | 12d |
| 27 | | text-to-speech | 1.7M | 734 | | 31d |
| 28 | | image-to-video | 1.6M | 1.1K | | 56d |
| 29 | | text-generation | 496K | 1.1K | | 21d |
| 30 | | text-to-speech | 9.4M | 6.1K | | 490d |
| 31 | | image-text-to-text | 489K | 1.1K | | 16d |
| 32 | | image-text-to-text | 19K | 33 | | 7d |
| 33 | | token-classification | 58K | 1.1K | | 12d |
| 34 | | — | 1.2M | 1.3K | | 57d |
| 35 | | image-text-to-text | 48K | 90 | | 7d |
| 36 | | text-generation | 256K | 1.6K | | 27d |
| 37 | | image-text-to-text | 33K | 119 | | 9d |
| 38 | | image-text-to-text | 30K | 62 | | 7d |
| 39 | | text-generation | 30K | 180 | | 13d |
| 40 | | image-text-to-text | 188K | 1.4K | | 26d |
| 41 | | — | 2.7K | 154 | | 3d |
| 42 | | image-text-to-text | 27K | 30 | | 7d |
| 43 | | gguf | 7.7K | 44 | | 6d |
| 44 | | text-generation | 7.6K | 161 | | 7d |
| 45 | | image-text-to-text | 24K | 52 | | 8d |
| 46 | | image-text-to-text | 7.5K | 29 | | 7d |
| 47 | | llama.cpp | 7.2K | 68 | | 4d |
| 48 | | image-text-to-text | 20K | 40 | | 9d |
| 49 | | text-generation | 135K | 541 | | 15d |
| 50 | | text-to-image | 1.2M | 4.5K | | 155d |
| 51 | | text-generation | 4.9K | 31 | | 4d |
| 52 | | text-to-speech | 102K | 1.3K | | 27d |
| 53 | | text-generation | 14K | 51 | | 12d |
| 54 | | text-generation | 4.1K | 29 | | 6d |
| 55 | | image-text-to-text | 243K | 308 | | 44d |
| 56 | | automatic-speech-recognition | 737K | 1.1K | | 98d |
| 57 | | text-to-image | 701K | 13K | | 637d |
| 58 | | image-text-to-text | 470K | 2.8K | | 62d |
| 59 | | any-to-any | 9.8K | 138 | | 10d |
| 60 | | — | 166K | 451 | | 37d |
| 61 | | diffusion-single-file | 365K | 1.2K | | 90d |
| 62 | | text-generation | 1.5K | 46 | | 6d |
| 63 | | text-generation | 396 | 292 | | 3d |
| 64 | | text-generation | 1.1K | 63 | | 6d |
| 65 | | — | 3.0K | 184 | | 8d |
| 66 | | text-generation | 858 | 37 | | 6d |
| 67 | | text-generation | 675 | 37 | | 6d |
| 68 | | image-text-to-text | 1.8K | 36 | | 7d |
| 69 | | — | 1.5K | 240 | | 8d |
| 70 | | text-to-image | 8.5K | 587 | | 23d |
| 71 | | image-text-to-text | 1.2K | 44 | | 9d |
| 72 | | automatic-speech-recognition | 354 | 50 | | 7d |
| 73 | | text-generation | 7.7K | 184 | | 17d |
| 74 | | image-to-image | 20K | 324 | | 55d |
| 75 | | text-generation | 6.0K | 87 | | 24d |
| 76 | | image-text-to-text | 240 | 44 | | 4d |
| 77 | | text-generation | 73 | 27 | | 3d |
| 78 | | text-generation | 609 | 46 | | 8d |
| 79 | | any-to-any | 506 | 234 | | 7d |
| 80 | | image-to-3d | 3.1K | 625 | | 20d |
| 81 | | — | 117 | 38 | | 5d |
| 82 | | text-to-image | 105 | 37 | | 5d |
| 83 | | — | 29 | 76 | | 2d |
| 84 | | — | 59 | 27 | | 5d |
| 85 | | automatic-speech-recognition | 110 | 31 | | 14d |
| 86 | | image-to-image | 741 | 32 | | 26d |
| 87 | | any-to-any | 74 | 67 | | 8d |
| 88 | | text-generation | 15 | 128 | | 6d |
| 89 | | — | 227 | 85 | | 30d |
| 90 | | text-generation | 124 | 36 | | 24d |
| 91 | | text-generation | 0 | 72 | | 2d |
| 92 | | sapiens | 0 | 95 | | 6d |
| 93 | | mlx | 0 | 28 | | 6d |
| 94 | | text-to-speech | 19 | 47 | | 14d |
| 95 | | — | 0 | 150 | | 10d |
| 96 | | any-to-any | 0 | 70 | | 10d |
| 97 | | — | 0 | 50 | | 10d |
| 98 | | — | 0 | 183 | | 14d |
| 99 | | image-to-video | 0 | 434 | | 55d |
| 100 | | image-to-3d | 0 | 815 | | 150d |