Add new SentenceTransformer model
Browse files- .gitattributes +1 -0
- 1_Pooling/config.json +10 -0
- README.md +501 -0
- config.json +28 -0
- config_sentence_transformers.json +10 -0
- model.safetensors +3 -0
- modules.json +14 -0
- sentence_bert_config.json +4 -0
- sentencepiece.bpe.model +3 -0
- special_tokens_map.json +51 -0
- tokenizer.json +3 -0
- tokenizer_config.json +62 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
1_Pooling/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"word_embedding_dimension": 768,
|
| 3 |
+
"pooling_mode_cls_token": false,
|
| 4 |
+
"pooling_mode_mean_tokens": true,
|
| 5 |
+
"pooling_mode_max_tokens": false,
|
| 6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
| 7 |
+
"pooling_mode_weightedmean_tokens": false,
|
| 8 |
+
"pooling_mode_lasttoken": false,
|
| 9 |
+
"include_prompt": true
|
| 10 |
+
}
|
README.md
ADDED
|
@@ -0,0 +1,501 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- sentence-transformers
|
| 4 |
+
- sentence-similarity
|
| 5 |
+
- feature-extraction
|
| 6 |
+
- generated_from_trainer
|
| 7 |
+
- dataset_size:2000
|
| 8 |
+
- loss:MultipleNegativesRankingLoss
|
| 9 |
+
base_model: sentence-transformers/paraphrase-multilingual-mpnet-base-v2
|
| 10 |
+
widget:
|
| 11 |
+
- source_sentence: What is a story about a student in Japan, caught between the Britannian
|
| 12 |
+
and Area 11 forces in the year 2010, who gains the power to command absolute obedience
|
| 13 |
+
and leads a rebellion against the Holy Empire of Britannia?
|
| 14 |
+
sentences:
|
| 15 |
+
- Makoto Konno is in her last year of high school, but is having a hard time deciding
|
| 16 |
+
what to do with her future. In between enduring the pressure of her teachers and
|
| 17 |
+
killing time with her best friends, Makoto's life suddenly changes when she accidentally
|
| 18 |
+
discovers that she is capable of literally leaping through time. Toki wo Kakeru
|
| 19 |
+
Shoujo follows Makoto as she plays around with her newfound power. However, she
|
| 20 |
+
soon learns the hard way that every choice has a consequence, and time is a lot
|
| 21 |
+
more complicated than it may seem.
|
| 22 |
+
- Wishing to be independent, 16-year-old Maika Sakuranomiya is desperate to nail
|
| 23 |
+
down a part-time job so that she can afford to study abroad. Unfortunately, her
|
| 24 |
+
applications are constantly rejected due to the menacing look she unintentionally
|
| 25 |
+
makes whenever she smiles, despite her otherwise cheerful disposition. After yet
|
| 26 |
+
another failed interview, she chances upon Café Stile, a coffee shop where the
|
| 27 |
+
servers interact with the customers while roleplaying distinctive characteristics.
|
| 28 |
+
The Italian store manager, Dino, becomes infatuated with Maika's cuteness at first
|
| 29 |
+
sight, and offers her a job as a waitress with a sadistic nature. Coupled with
|
| 30 |
+
her inherent clumsiness, she successfully manages to serve a pair of masochistic
|
| 31 |
+
customers in accordance with her new, ruthless persona. Alongside Kaho Hinata
|
| 32 |
+
as the tsundere and Mafuyu Hoshikawa as the younger sister, Maika decides to make
|
| 33 |
+
the most out of her unique quirk and cements her position in the cafe with merciless
|
| 34 |
+
cruelty!
|
| 35 |
+
- In the year 2010, the Holy Empire of Britannia is establishing itself as a dominant
|
| 36 |
+
military nation, starting with the conquest of Japan. Renamed to Area 11 after
|
| 37 |
+
its swift defeat, Japan has seen significant resistance against these tyrants
|
| 38 |
+
in an attempt to regain independence. Lelouch Lamperouge, a Britannian student,
|
| 39 |
+
unfortunately finds himself caught in a crossfire between the Britannian and the
|
| 40 |
+
Area 11 rebel armed forces. He is able to escape, however, thanks to the timely
|
| 41 |
+
appearance of a mysterious girl named C.C., who bestows upon him Geass, the "Power
|
| 42 |
+
of Kings." Realizing the vast potential of his newfound "power of absolute obedience,"
|
| 43 |
+
Lelouch embarks upon a perilous journey as the masked vigilante known as Zero,
|
| 44 |
+
leading a merciless onslaught against Britannia in order to get revenge once and
|
| 45 |
+
for all.
|
| 46 |
+
- source_sentence: '"Find an anime where a group of new demon slayers, including Tanjirou
|
| 47 |
+
Kamado, Zenitsu Agatsuma, and Inosuke Hashibira, team up with the Flame Pillar,
|
| 48 |
+
Kyoujurou Rengoku, to investigate mysterious disappearances on a train and face
|
| 49 |
+
off against powerful demonic forces to save the passengers."'
|
| 50 |
+
sentences:
|
| 51 |
+
- 'Fear, survival, instinct. Thrown into a foreign land with nothing but hazy memories
|
| 52 |
+
and the knowledge of their name, they can feel only these three emotions resonating
|
| 53 |
+
deep within their souls. A group of strangers is given no other choice than to
|
| 54 |
+
accept the only paying job in this game-like world—the role of a soldier in the
|
| 55 |
+
Reserve Army—and eliminate anything that threatens the peace in their new world,
|
| 56 |
+
Grimgar. When all of the stronger candidates join together, those left behind
|
| 57 |
+
must create a party together to survive: Manato, a charismatic leader and priest;
|
| 58 |
+
Haruhiro, a nervous thief; Yume, a cheerful hunter; Shihoru, a shy mage; Moguzo,
|
| 59 |
+
a kind warrior; and Ranta, a rowdy dark knight. Despite its resemblance to one,
|
| 60 |
+
this is no game—there are no redos or respawns; it is kill or be killed. It is
|
| 61 |
+
now up to this ragtag group of unlikely fighters to survive together in a world
|
| 62 |
+
where life and death are separated only by a fine line.'
|
| 63 |
+
- Genius thief Arsene Lupin III—along with the usual crew of Goemon Ishikawa XIII,
|
| 64 |
+
Fujiko Mine, and Daisuke Jigen—finds himself in modern-day France, where he encounters
|
| 65 |
+
both new and old adversaries, with Inspector Kouichi Zenigata still hot on his
|
| 66 |
+
trail. As they steal from darker, more sinister entities, they will also have
|
| 67 |
+
to find a way to deal with the newest technology in their escapades, as well as
|
| 68 |
+
face the ghosts of their pasts. However, this time, Lupin's choices begin to catch
|
| 69 |
+
up with him as his pursuers use every tool at their disposal to take him down
|
| 70 |
+
once and for all.
|
| 71 |
+
- 'After a string of mysterious disappearances begins to plague a train, the Demon
|
| 72 |
+
Slayer Corps'' multiple attempts to remedy the problem prove fruitless. To prevent
|
| 73 |
+
further casualties, the Flame Pillar, Kyoujurou Rengoku, takes it upon himself
|
| 74 |
+
to eliminate the threat. Accompanying him are some of the Corps'' most promising
|
| 75 |
+
new blood: Tanjirou Kamado, Zenitsu Agatsuma, and Inosuke Hashibira, who all hope
|
| 76 |
+
to witness the fiery feats of this model demon slayer firsthand. Unbeknownst to
|
| 77 |
+
them, the demonic forces responsible for the disappearances have already put their
|
| 78 |
+
sinister plan in motion. Under this demonic presence, the group must muster every
|
| 79 |
+
ounce of their willpower and draw their swords to save all two hundred passengers
|
| 80 |
+
onboard. As things begin to spiral out of control, Tanjirou''s resolve and commitment
|
| 81 |
+
to duty are put to the test.'
|
| 82 |
+
- source_sentence: '"What is a query for an anime about a team competing in intense
|
| 83 |
+
battles at their agency headquarters to secure a spot in an upcoming mission,
|
| 84 |
+
undergoing training with a new member and facing internal disputes?"'
|
| 85 |
+
sentences:
|
| 86 |
+
- At the Border Defense Agency's headquarters, the B-Rank Wars are underway as each
|
| 87 |
+
team fights intensely to secure a spot in the upcoming Away Mission. Though Osamu
|
| 88 |
+
Mikumo and the rest of Tamakoma-2 have pulled through thus far, the final rounds
|
| 89 |
+
will require them to push far beyond the limits of their current abilities. Taking
|
| 90 |
+
in a talented new member, the squad begins to train and develop new strategies,
|
| 91 |
+
but, amid these efforts, the team is shaken by a heated dispute—one that could
|
| 92 |
+
jeopardize their ticket to the Neighbor's dimension.
|
| 93 |
+
- Kyousuke Kasuga is no stranger to being the new kid at school. Despite only being
|
| 94 |
+
a third-year middle schooler, he has spent his entire childhood avoiding those
|
| 95 |
+
who discover his family's paranormal powers, and he has had to change schools
|
| 96 |
+
seven times as a result. Upon catching a beautiful girl's hat, he becomes optimistic
|
| 97 |
+
and hopes that he and his family have finally moved for the last time. When Kyousuke
|
| 98 |
+
gets to school, however, he learns a different story. The elegant girl he just
|
| 99 |
+
met turns out to be none other than Madoka Ayukawa—also known as "Madoka the Pick"—a
|
| 100 |
+
delinquent known to smoke, drink, and get into fights. Her best friend is first-year
|
| 101 |
+
Hikaru Hiyama, a childish and energetic girl who quickly falls in love with Kyousuke.
|
| 102 |
+
Enamored with both girls, Kyousuke tries to balance a delicate triangle of emotions,
|
| 103 |
+
all while dealing with the antics brought about by a family with paranormal powers.
|
| 104 |
+
- At Shirahamazaka High School, a special recital is held every year in which music
|
| 105 |
+
students are able to showcase their talents in front of professionals and other
|
| 106 |
+
prestigious guests. Third-year Konatsu Miyamoto desperately wants to sing in her
|
| 107 |
+
last high school recital, but because she screwed up the year before, the vice
|
| 108 |
+
principal has barred her from participating. That's when Konatsu comes up with
|
| 109 |
+
a new plan to get involved; instead of joining the official choir, she'll form
|
| 110 |
+
her own singing club with her friends! Unfortunately this proves to be harder
|
| 111 |
+
than she imagined. Her friend Wakana Sakai has given up on singing, for one, and
|
| 112 |
+
Konatsu needs more than just two members. With only a month left until the recital,
|
| 113 |
+
will Konatsu be able to find enough members for her club and actually be ready
|
| 114 |
+
to sing at one of the most important events of the school year and graduate without
|
| 115 |
+
regrets?
|
| 116 |
+
- source_sentence: What is a romantic comedy anime about a man who keeps getting into
|
| 117 |
+
lewd situations with women, including an alien princess and her twin sisters,
|
| 118 |
+
while also dealing with a weapon girl trying to kill him?
|
| 119 |
+
sentences:
|
| 120 |
+
- Love, Miki and Inori are on their way to a dance contest, but get lost on their
|
| 121 |
+
way to Minato Mirai. Still looking for their way, they are attacked by a monster.
|
| 122 |
+
When the three Fresh Precure girls start to fight it, other Precures show up to
|
| 123 |
+
support them. They all have to combine their powers to win against this mighty
|
| 124 |
+
enemy.
|
| 125 |
+
- Although learning different languages continues to be an interest for Shinobu
|
| 126 |
+
and her friends, the new school year brings unexpected difficulties. Not only
|
| 127 |
+
is there always something new and different to distract them from their studies,
|
| 128 |
+
but Alice and Yoko also are having trouble adjusting to being in a different class
|
| 129 |
+
from Shinobu and Aya. Meanwhile, Karen isn't getting along at all with her new
|
| 130 |
+
homeroom teacher, and it doesn't help that the teacher is having trouble figuring
|
| 131 |
+
out how to make herself seem friendlier to her students as well. Craziness may
|
| 132 |
+
ensue, but sometimes, all it takes is the right mutual experience to bring everyone
|
| 133 |
+
together. While some of those experiences may not be as well-thought-out as others
|
| 134 |
+
(like when Alice and Aya act like juvenile delinquents to seem more grown up),
|
| 135 |
+
the gang's new adventures are certain to warm everyone's heart as the fun and
|
| 136 |
+
friendships keep growing in HELLO!! KINMOZA!
|
| 137 |
+
- 'Rito Yuuki never gets a break—he''s always finding himself in lewd accidents
|
| 138 |
+
with girls around him. Although his heart still yearns for Haruna, his childhood
|
| 139 |
+
love, Rito can''t help but question his feelings for Lala, the alien princess
|
| 140 |
+
who appeared in front of him and declared she would marry him. But now, it''s
|
| 141 |
+
not just Lala he has to deal with: her younger twin sisters, Momo and Nana, have
|
| 142 |
+
also traveled to Earth, wanting to meet their older sister''s fiancé, and just
|
| 143 |
+
as luck would have it, they end up staying at Rito''s home. Meanwhile, amidst
|
| 144 |
+
the bustle of his new family members, Yami, the human weapon girl, begins her
|
| 145 |
+
pursuit for Rito. It''s not an easy life for Rito as he deals with uncertain love,
|
| 146 |
+
punishment for being a pervert, and a girl dead set on murdering him.'
|
| 147 |
+
- source_sentence: What is the story about a haunted school where the ghosts seek
|
| 148 |
+
revenge on the students who banished them years ago?
|
| 149 |
+
sentences:
|
| 150 |
+
- Years ago, all of the ghosts in a haunted schoolhouse were banished by a certain
|
| 151 |
+
student. Now, they're back—and they want revenge... Satsuki and Keiichirou Miyanoshita
|
| 152 |
+
are two siblings recovering from the tragic loss of their mother. After moving
|
| 153 |
+
to their mother's hometown, they learn that the local school they have transferred
|
| 154 |
+
to is an old building—one said to be haunted. Despite initially brushing it off
|
| 155 |
+
as a silly rumor, the two soon discover that ghosts are indeed real and that they're
|
| 156 |
+
after them! Gakkou no Kaidan is the creepy tale of the lives of these siblings
|
| 157 |
+
and their newfound friends as they try to survive the school's ghosts—with a little
|
| 158 |
+
help from their pet cat along the way.
|
| 159 |
+
- 'The villainous Dr. Hell has amassed an army of mechanical beasts in his secret
|
| 160 |
+
hideaway, the island of Bardos located in the Aegean Sea. He is capable of controlling
|
| 161 |
+
mechanized beasts with his cane, and instructs them to unleash devastating attacks.
|
| 162 |
+
However, Dr. Hell doesn''t do all the dirty work by himself; he has his loyal
|
| 163 |
+
henchman Baron Ashura to carry out his devilish plans. There are also those that
|
| 164 |
+
will see to it that evil does not prevail. Kouji Kabuto is the young and feisty
|
| 165 |
+
teenager with a score to settle: his goal is avenging the murder of his grandfather
|
| 166 |
+
by Dr. Hell. And he might just be able to pull it off, as he is the pilot of Mazinger
|
| 167 |
+
Z, a mighty giant robot made out of an indestructible metal known as Super-Alloy
|
| 168 |
+
Z. Mazinger Z boasts several powerful special attacks. By channeling Photonic
|
| 169 |
+
Energy through its eyes, and unleashing the Koushiryoku Beam, it can cause great
|
| 170 |
+
destruction. But things get really cool when Mazinger Z launches its Rocket Punch
|
| 171 |
+
attack. Dr. Hell and his minions might have just found their match!'
|
| 172 |
+
- The final hour of the popular virtual reality game Yggdrasil has come. However,
|
| 173 |
+
Momonga, a powerful wizard and master of the dark guild Ainz Ooal Gown, decides
|
| 174 |
+
to spend his last few moments in the game as the servers begin to shut down. To
|
| 175 |
+
his surprise, despite the clock having struck midnight, Momonga is still fully
|
| 176 |
+
conscious as his character and, moreover, the non-player characters appear to
|
| 177 |
+
have developed personalities of their own! Confronted with this abnormal situation,
|
| 178 |
+
Momonga commands his loyal servants to help him investigate and take control of
|
| 179 |
+
this new world, with the hopes of figuring out what has caused this development
|
| 180 |
+
and if there may be others in the same predicament.
|
| 181 |
+
pipeline_tag: sentence-similarity
|
| 182 |
+
library_name: sentence-transformers
|
| 183 |
+
---
|
| 184 |
+
|
| 185 |
+
# SentenceTransformer based on sentence-transformers/paraphrase-multilingual-mpnet-base-v2
|
| 186 |
+
|
| 187 |
+
This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [sentence-transformers/paraphrase-multilingual-mpnet-base-v2](https://huggingface.co/sentence-transformers/paraphrase-multilingual-mpnet-base-v2). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
| 188 |
+
|
| 189 |
+
## Model Details
|
| 190 |
+
|
| 191 |
+
### Model Description
|
| 192 |
+
- **Model Type:** Sentence Transformer
|
| 193 |
+
- **Base model:** [sentence-transformers/paraphrase-multilingual-mpnet-base-v2](https://huggingface.co/sentence-transformers/paraphrase-multilingual-mpnet-base-v2) <!-- at revision 84fccfe766bcfd679e39efefe4ebf45af190ad2d -->
|
| 194 |
+
- **Maximum Sequence Length:** 128 tokens
|
| 195 |
+
- **Output Dimensionality:** 768 dimensions
|
| 196 |
+
- **Similarity Function:** Cosine Similarity
|
| 197 |
+
<!-- - **Training Dataset:** Unknown -->
|
| 198 |
+
<!-- - **Language:** Unknown -->
|
| 199 |
+
<!-- - **License:** Unknown -->
|
| 200 |
+
|
| 201 |
+
### Model Sources
|
| 202 |
+
|
| 203 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
| 204 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
| 205 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
| 206 |
+
|
| 207 |
+
### Full Model Architecture
|
| 208 |
+
|
| 209 |
+
```
|
| 210 |
+
SentenceTransformer(
|
| 211 |
+
(0): Transformer({'max_seq_length': 128, 'do_lower_case': False}) with Transformer model: XLMRobertaModel
|
| 212 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
| 213 |
+
)
|
| 214 |
+
```
|
| 215 |
+
|
| 216 |
+
## Usage
|
| 217 |
+
|
| 218 |
+
### Direct Usage (Sentence Transformers)
|
| 219 |
+
|
| 220 |
+
First install the Sentence Transformers library:
|
| 221 |
+
|
| 222 |
+
```bash
|
| 223 |
+
pip install -U sentence-transformers
|
| 224 |
+
```
|
| 225 |
+
|
| 226 |
+
Then you can load this model and run inference.
|
| 227 |
+
```python
|
| 228 |
+
from sentence_transformers import SentenceTransformer
|
| 229 |
+
|
| 230 |
+
# Download from the 🤗 Hub
|
| 231 |
+
model = SentenceTransformer("KiruruP/anime-recommendation-multilingual-mpnet-base-v2-v2")
|
| 232 |
+
# Run inference
|
| 233 |
+
sentences = [
|
| 234 |
+
'What is the story about a haunted school where the ghosts seek revenge on the students who banished them years ago?',
|
| 235 |
+
"Years ago, all of the ghosts in a haunted schoolhouse were banished by a certain student. Now, they're back—and they want revenge... Satsuki and Keiichirou Miyanoshita are two siblings recovering from the tragic loss of their mother. After moving to their mother's hometown, they learn that the local school they have transferred to is an old building—one said to be haunted. Despite initially brushing it off as a silly rumor, the two soon discover that ghosts are indeed real and that they're after them! Gakkou no Kaidan is the creepy tale of the lives of these siblings and their newfound friends as they try to survive the school's ghosts—with a little help from their pet cat along the way.",
|
| 236 |
+
'The final hour of the popular virtual reality game Yggdrasil has come. However, Momonga, a powerful wizard and master of the dark guild Ainz Ooal Gown, decides to spend his last few moments in the game as the servers begin to shut down. To his surprise, despite the clock having struck midnight, Momonga is still fully conscious as his character and, moreover, the non-player characters appear to have developed personalities of their own! Confronted with this abnormal situation, Momonga commands his loyal servants to help him investigate and take control of this new world, with the hopes of figuring out what has caused this development and if there may be others in the same predicament.',
|
| 237 |
+
]
|
| 238 |
+
embeddings = model.encode(sentences)
|
| 239 |
+
print(embeddings.shape)
|
| 240 |
+
# (3, 768)
|
| 241 |
+
|
| 242 |
+
# Get the similarity scores for the embeddings
|
| 243 |
+
similarities = model.similarity(embeddings, embeddings)
|
| 244 |
+
print(similarities.shape)
|
| 245 |
+
# torch.Size([3, 3])
|
| 246 |
+
```
|
| 247 |
+
|
| 248 |
+
<!--
|
| 249 |
+
### Direct Usage (Transformers)
|
| 250 |
+
|
| 251 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
| 252 |
+
|
| 253 |
+
</details>
|
| 254 |
+
-->
|
| 255 |
+
|
| 256 |
+
<!--
|
| 257 |
+
### Downstream Usage (Sentence Transformers)
|
| 258 |
+
|
| 259 |
+
You can finetune this model on your own dataset.
|
| 260 |
+
|
| 261 |
+
<details><summary>Click to expand</summary>
|
| 262 |
+
|
| 263 |
+
</details>
|
| 264 |
+
-->
|
| 265 |
+
|
| 266 |
+
<!--
|
| 267 |
+
### Out-of-Scope Use
|
| 268 |
+
|
| 269 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
| 270 |
+
-->
|
| 271 |
+
|
| 272 |
+
<!--
|
| 273 |
+
## Bias, Risks and Limitations
|
| 274 |
+
|
| 275 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
| 276 |
+
-->
|
| 277 |
+
|
| 278 |
+
<!--
|
| 279 |
+
### Recommendations
|
| 280 |
+
|
| 281 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
| 282 |
+
-->
|
| 283 |
+
|
| 284 |
+
## Training Details
|
| 285 |
+
|
| 286 |
+
### Training Dataset
|
| 287 |
+
|
| 288 |
+
#### Unnamed Dataset
|
| 289 |
+
|
| 290 |
+
* Size: 2,000 training samples
|
| 291 |
+
* Columns: <code>sentence_0</code> and <code>sentence_1</code>
|
| 292 |
+
* Approximate statistics based on the first 1000 samples:
|
| 293 |
+
| | sentence_0 | sentence_1 |
|
| 294 |
+
|:--------|:-----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|
|
| 295 |
+
| type | string | string |
|
| 296 |
+
| details | <ul><li>min: 18 tokens</li><li>mean: 47.9 tokens</li><li>max: 128 tokens</li></ul> | <ul><li>min: 51 tokens</li><li>mean: 122.5 tokens</li><li>max: 128 tokens</li></ul> |
|
| 297 |
+
* Samples:
|
| 298 |
+
| sentence_0 | sentence_1 |
|
| 299 |
+
|:--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
| 300 |
+
| <code>What is the query for a story about a teenager seeking revenge on a villainous scientist with an army of mechanical beasts, located on an island in the Aegean Sea, who controls them with a cane, and has a loyal henchman? The teenager pilots a powerful robot made of indestructible metal to stop them.</code> | <code>The villainous Dr. Hell has amassed an army of mechanical beasts in his secret hideaway, the island of Bardos located in the Aegean Sea. He is capable of controlling mechanized beasts with his cane, and instructs them to unleash devastating attacks. However, Dr. Hell doesn't do all the dirty work by himself; he has his loyal henchman Baron Ashura to carry out his devilish plans. There are also those that will see to it that evil does not prevail. Kouji Kabuto is the young and feisty teenager with a score to settle: his goal is avenging the murder of his grandfather by Dr. Hell. And he might just be able to pull it off, as he is the pilot of Mazinger Z, a mighty giant robot made out of an indestructible metal known as Super-Alloy Z. Mazinger Z boasts several powerful special attacks. By channeling Photonic Energy through its eyes, and unleashing the Koushiryoku Beam, it can cause great destruction. But things get really cool when Mazinger Z launches its Rocket Punch attack. Dr. Hell and...</code> |
|
| 301 |
+
| <code>What is a manga about a struggling artist named Da Shu who finds companionship with a young man with cat ears?</code> | <code>Da Shu is a a manga creator who grew up in an orphanage, and whose works do not sell very well. Da Shu lives each lonely day in boredom, but one day he meets a young man named Miao who has cat ears, and his everyday life completely changes. Miao gets in trouble every day, but for the first time in his life, Da Shu's heart experiences "warmth."</code> |
|
| 302 |
+
| <code>What is a group of amnesiac strangers forced to become soldiers in a dangerous world called, where they must form a party to survive?</code> | <code>Fear, survival, instinct. Thrown into a foreign land with nothing but hazy memories and the knowledge of their name, they can feel only these three emotions resonating deep within their souls. A group of strangers is given no other choice than to accept the only paying job in this game-like world—the role of a soldier in the Reserve Army—and eliminate anything that threatens the peace in their new world, Grimgar. When all of the stronger candidates join together, those left behind must create a party together to survive: Manato, a charismatic leader and priest; Haruhiro, a nervous thief; Yume, a cheerful hunter; Shihoru, a shy mage; Moguzo, a kind warrior; and Ranta, a rowdy dark knight. Despite its resemblance to one, this is no game—there are no redos or respawns; it is kill or be killed. It is now up to this ragtag group of unlikely fighters to survive together in a world where life and death are separated only by a fine line.</code> |
|
| 303 |
+
* Loss: [<code>MultipleNegativesRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativesrankingloss) with these parameters:
|
| 304 |
+
```json
|
| 305 |
+
{
|
| 306 |
+
"scale": 20.0,
|
| 307 |
+
"similarity_fct": "cos_sim"
|
| 308 |
+
}
|
| 309 |
+
```
|
| 310 |
+
|
| 311 |
+
### Training Hyperparameters
|
| 312 |
+
#### Non-Default Hyperparameters
|
| 313 |
+
|
| 314 |
+
- `per_device_train_batch_size`: 16
|
| 315 |
+
- `per_device_eval_batch_size`: 16
|
| 316 |
+
- `num_train_epochs`: 10
|
| 317 |
+
- `multi_dataset_batch_sampler`: round_robin
|
| 318 |
+
|
| 319 |
+
#### All Hyperparameters
|
| 320 |
+
<details><summary>Click to expand</summary>
|
| 321 |
+
|
| 322 |
+
- `overwrite_output_dir`: False
|
| 323 |
+
- `do_predict`: False
|
| 324 |
+
- `eval_strategy`: no
|
| 325 |
+
- `prediction_loss_only`: True
|
| 326 |
+
- `per_device_train_batch_size`: 16
|
| 327 |
+
- `per_device_eval_batch_size`: 16
|
| 328 |
+
- `per_gpu_train_batch_size`: None
|
| 329 |
+
- `per_gpu_eval_batch_size`: None
|
| 330 |
+
- `gradient_accumulation_steps`: 1
|
| 331 |
+
- `eval_accumulation_steps`: None
|
| 332 |
+
- `torch_empty_cache_steps`: None
|
| 333 |
+
- `learning_rate`: 5e-05
|
| 334 |
+
- `weight_decay`: 0.0
|
| 335 |
+
- `adam_beta1`: 0.9
|
| 336 |
+
- `adam_beta2`: 0.999
|
| 337 |
+
- `adam_epsilon`: 1e-08
|
| 338 |
+
- `max_grad_norm`: 1
|
| 339 |
+
- `num_train_epochs`: 10
|
| 340 |
+
- `max_steps`: -1
|
| 341 |
+
- `lr_scheduler_type`: linear
|
| 342 |
+
- `lr_scheduler_kwargs`: {}
|
| 343 |
+
- `warmup_ratio`: 0.0
|
| 344 |
+
- `warmup_steps`: 0
|
| 345 |
+
- `log_level`: passive
|
| 346 |
+
- `log_level_replica`: warning
|
| 347 |
+
- `log_on_each_node`: True
|
| 348 |
+
- `logging_nan_inf_filter`: True
|
| 349 |
+
- `save_safetensors`: True
|
| 350 |
+
- `save_on_each_node`: False
|
| 351 |
+
- `save_only_model`: False
|
| 352 |
+
- `restore_callback_states_from_checkpoint`: False
|
| 353 |
+
- `no_cuda`: False
|
| 354 |
+
- `use_cpu`: False
|
| 355 |
+
- `use_mps_device`: False
|
| 356 |
+
- `seed`: 42
|
| 357 |
+
- `data_seed`: None
|
| 358 |
+
- `jit_mode_eval`: False
|
| 359 |
+
- `use_ipex`: False
|
| 360 |
+
- `bf16`: False
|
| 361 |
+
- `fp16`: False
|
| 362 |
+
- `fp16_opt_level`: O1
|
| 363 |
+
- `half_precision_backend`: auto
|
| 364 |
+
- `bf16_full_eval`: False
|
| 365 |
+
- `fp16_full_eval`: False
|
| 366 |
+
- `tf32`: None
|
| 367 |
+
- `local_rank`: 0
|
| 368 |
+
- `ddp_backend`: None
|
| 369 |
+
- `tpu_num_cores`: None
|
| 370 |
+
- `tpu_metrics_debug`: False
|
| 371 |
+
- `debug`: []
|
| 372 |
+
- `dataloader_drop_last`: False
|
| 373 |
+
- `dataloader_num_workers`: 0
|
| 374 |
+
- `dataloader_prefetch_factor`: None
|
| 375 |
+
- `past_index`: -1
|
| 376 |
+
- `disable_tqdm`: False
|
| 377 |
+
- `remove_unused_columns`: True
|
| 378 |
+
- `label_names`: None
|
| 379 |
+
- `load_best_model_at_end`: False
|
| 380 |
+
- `ignore_data_skip`: False
|
| 381 |
+
- `fsdp`: []
|
| 382 |
+
- `fsdp_min_num_params`: 0
|
| 383 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
| 384 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
| 385 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
| 386 |
+
- `deepspeed`: None
|
| 387 |
+
- `label_smoothing_factor`: 0.0
|
| 388 |
+
- `optim`: adamw_torch
|
| 389 |
+
- `optim_args`: None
|
| 390 |
+
- `adafactor`: False
|
| 391 |
+
- `group_by_length`: False
|
| 392 |
+
- `length_column_name`: length
|
| 393 |
+
- `ddp_find_unused_parameters`: None
|
| 394 |
+
- `ddp_bucket_cap_mb`: None
|
| 395 |
+
- `ddp_broadcast_buffers`: False
|
| 396 |
+
- `dataloader_pin_memory`: True
|
| 397 |
+
- `dataloader_persistent_workers`: False
|
| 398 |
+
- `skip_memory_metrics`: True
|
| 399 |
+
- `use_legacy_prediction_loop`: False
|
| 400 |
+
- `push_to_hub`: False
|
| 401 |
+
- `resume_from_checkpoint`: None
|
| 402 |
+
- `hub_model_id`: None
|
| 403 |
+
- `hub_strategy`: every_save
|
| 404 |
+
- `hub_private_repo`: None
|
| 405 |
+
- `hub_always_push`: False
|
| 406 |
+
- `hub_revision`: None
|
| 407 |
+
- `gradient_checkpointing`: False
|
| 408 |
+
- `gradient_checkpointing_kwargs`: None
|
| 409 |
+
- `include_inputs_for_metrics`: False
|
| 410 |
+
- `include_for_metrics`: []
|
| 411 |
+
- `eval_do_concat_batches`: True
|
| 412 |
+
- `fp16_backend`: auto
|
| 413 |
+
- `push_to_hub_model_id`: None
|
| 414 |
+
- `push_to_hub_organization`: None
|
| 415 |
+
- `mp_parameters`:
|
| 416 |
+
- `auto_find_batch_size`: False
|
| 417 |
+
- `full_determinism`: False
|
| 418 |
+
- `torchdynamo`: None
|
| 419 |
+
- `ray_scope`: last
|
| 420 |
+
- `ddp_timeout`: 1800
|
| 421 |
+
- `torch_compile`: False
|
| 422 |
+
- `torch_compile_backend`: None
|
| 423 |
+
- `torch_compile_mode`: None
|
| 424 |
+
- `include_tokens_per_second`: False
|
| 425 |
+
- `include_num_input_tokens_seen`: False
|
| 426 |
+
- `neftune_noise_alpha`: None
|
| 427 |
+
- `optim_target_modules`: None
|
| 428 |
+
- `batch_eval_metrics`: False
|
| 429 |
+
- `eval_on_start`: False
|
| 430 |
+
- `use_liger_kernel`: False
|
| 431 |
+
- `liger_kernel_config`: None
|
| 432 |
+
- `eval_use_gather_object`: False
|
| 433 |
+
- `average_tokens_across_devices`: False
|
| 434 |
+
- `prompts`: None
|
| 435 |
+
- `batch_sampler`: batch_sampler
|
| 436 |
+
- `multi_dataset_batch_sampler`: round_robin
|
| 437 |
+
|
| 438 |
+
</details>
|
| 439 |
+
|
| 440 |
+
### Training Logs
|
| 441 |
+
| Epoch | Step | Training Loss |
|
| 442 |
+
|:-----:|:----:|:-------------:|
|
| 443 |
+
| 4.0 | 500 | 0.0258 |
|
| 444 |
+
| 8.0 | 1000 | 0.0015 |
|
| 445 |
+
|
| 446 |
+
|
| 447 |
+
### Framework Versions
|
| 448 |
+
- Python: 3.11.13
|
| 449 |
+
- Sentence Transformers: 4.1.0
|
| 450 |
+
- Transformers: 4.54.0
|
| 451 |
+
- PyTorch: 2.6.0+cu124
|
| 452 |
+
- Accelerate: 1.9.0
|
| 453 |
+
- Datasets: 4.0.0
|
| 454 |
+
- Tokenizers: 0.21.2
|
| 455 |
+
|
| 456 |
+
## Citation
|
| 457 |
+
|
| 458 |
+
### BibTeX
|
| 459 |
+
|
| 460 |
+
#### Sentence Transformers
|
| 461 |
+
```bibtex
|
| 462 |
+
@inproceedings{reimers-2019-sentence-bert,
|
| 463 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
| 464 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
| 465 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
| 466 |
+
month = "11",
|
| 467 |
+
year = "2019",
|
| 468 |
+
publisher = "Association for Computational Linguistics",
|
| 469 |
+
url = "https://arxiv.org/abs/1908.10084",
|
| 470 |
+
}
|
| 471 |
+
```
|
| 472 |
+
|
| 473 |
+
#### MultipleNegativesRankingLoss
|
| 474 |
+
```bibtex
|
| 475 |
+
@misc{henderson2017efficient,
|
| 476 |
+
title={Efficient Natural Language Response Suggestion for Smart Reply},
|
| 477 |
+
author={Matthew Henderson and Rami Al-Rfou and Brian Strope and Yun-hsuan Sung and Laszlo Lukacs and Ruiqi Guo and Sanjiv Kumar and Balint Miklos and Ray Kurzweil},
|
| 478 |
+
year={2017},
|
| 479 |
+
eprint={1705.00652},
|
| 480 |
+
archivePrefix={arXiv},
|
| 481 |
+
primaryClass={cs.CL}
|
| 482 |
+
}
|
| 483 |
+
```
|
| 484 |
+
|
| 485 |
+
<!--
|
| 486 |
+
## Glossary
|
| 487 |
+
|
| 488 |
+
*Clearly define terms in order to be accessible across audiences.*
|
| 489 |
+
-->
|
| 490 |
+
|
| 491 |
+
<!--
|
| 492 |
+
## Model Card Authors
|
| 493 |
+
|
| 494 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
| 495 |
+
-->
|
| 496 |
+
|
| 497 |
+
<!--
|
| 498 |
+
## Model Card Contact
|
| 499 |
+
|
| 500 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
| 501 |
+
-->
|
config.json
ADDED
|
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"XLMRobertaModel"
|
| 4 |
+
],
|
| 5 |
+
"attention_probs_dropout_prob": 0.1,
|
| 6 |
+
"bos_token_id": 0,
|
| 7 |
+
"classifier_dropout": null,
|
| 8 |
+
"eos_token_id": 2,
|
| 9 |
+
"gradient_checkpointing": false,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 768,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 3072,
|
| 15 |
+
"layer_norm_eps": 1e-05,
|
| 16 |
+
"max_position_embeddings": 514,
|
| 17 |
+
"model_type": "xlm-roberta",
|
| 18 |
+
"num_attention_heads": 12,
|
| 19 |
+
"num_hidden_layers": 12,
|
| 20 |
+
"output_past": true,
|
| 21 |
+
"pad_token_id": 1,
|
| 22 |
+
"position_embedding_type": "absolute",
|
| 23 |
+
"torch_dtype": "float32",
|
| 24 |
+
"transformers_version": "4.54.0",
|
| 25 |
+
"type_vocab_size": 1,
|
| 26 |
+
"use_cache": true,
|
| 27 |
+
"vocab_size": 250002
|
| 28 |
+
}
|
config_sentence_transformers.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"__version__": {
|
| 3 |
+
"sentence_transformers": "4.1.0",
|
| 4 |
+
"transformers": "4.54.0",
|
| 5 |
+
"pytorch": "2.6.0+cu124"
|
| 6 |
+
},
|
| 7 |
+
"prompts": {},
|
| 8 |
+
"default_prompt_name": null,
|
| 9 |
+
"similarity_fn_name": "cosine"
|
| 10 |
+
}
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c4b32037016952658bb6b71fb08f6684281300550d6440159513a99a388bc260
|
| 3 |
+
size 1112197096
|
modules.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"idx": 0,
|
| 4 |
+
"name": "0",
|
| 5 |
+
"path": "",
|
| 6 |
+
"type": "sentence_transformers.models.Transformer"
|
| 7 |
+
},
|
| 8 |
+
{
|
| 9 |
+
"idx": 1,
|
| 10 |
+
"name": "1",
|
| 11 |
+
"path": "1_Pooling",
|
| 12 |
+
"type": "sentence_transformers.models.Pooling"
|
| 13 |
+
}
|
| 14 |
+
]
|
sentence_bert_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"max_seq_length": 128,
|
| 3 |
+
"do_lower_case": false
|
| 4 |
+
}
|
sentencepiece.bpe.model
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
|
| 3 |
+
size 5069051
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<s>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"cls_token": {
|
| 10 |
+
"content": "<s>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"eos_token": {
|
| 17 |
+
"content": "</s>",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"mask_token": {
|
| 24 |
+
"content": "<mask>",
|
| 25 |
+
"lstrip": true,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"pad_token": {
|
| 31 |
+
"content": "<pad>",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
},
|
| 37 |
+
"sep_token": {
|
| 38 |
+
"content": "</s>",
|
| 39 |
+
"lstrip": false,
|
| 40 |
+
"normalized": false,
|
| 41 |
+
"rstrip": false,
|
| 42 |
+
"single_word": false
|
| 43 |
+
},
|
| 44 |
+
"unk_token": {
|
| 45 |
+
"content": "<unk>",
|
| 46 |
+
"lstrip": false,
|
| 47 |
+
"normalized": false,
|
| 48 |
+
"rstrip": false,
|
| 49 |
+
"single_word": false
|
| 50 |
+
}
|
| 51 |
+
}
|
tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cad551d5600a84242d0973327029452a1e3672ba6313c2a3c3d69c4310e12719
|
| 3 |
+
size 17082987
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,62 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "<s>",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "<pad>",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "</s>",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "<unk>",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"250001": {
|
| 36 |
+
"content": "<mask>",
|
| 37 |
+
"lstrip": true,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"bos_token": "<s>",
|
| 45 |
+
"clean_up_tokenization_spaces": false,
|
| 46 |
+
"cls_token": "<s>",
|
| 47 |
+
"eos_token": "</s>",
|
| 48 |
+
"extra_special_tokens": {},
|
| 49 |
+
"mask_token": "<mask>",
|
| 50 |
+
"max_length": 128,
|
| 51 |
+
"model_max_length": 128,
|
| 52 |
+
"pad_to_multiple_of": null,
|
| 53 |
+
"pad_token": "<pad>",
|
| 54 |
+
"pad_token_type_id": 0,
|
| 55 |
+
"padding_side": "right",
|
| 56 |
+
"sep_token": "</s>",
|
| 57 |
+
"stride": 0,
|
| 58 |
+
"tokenizer_class": "XLMRobertaTokenizer",
|
| 59 |
+
"truncation_side": "right",
|
| 60 |
+
"truncation_strategy": "longest_first",
|
| 61 |
+
"unk_token": "<unk>"
|
| 62 |
+
}
|