Add new SentenceTransformer model
Browse files- 1_Pooling/config.json +10 -0
- README.md +636 -0
- config.json +24 -0
- config_sentence_transformers.json +10 -0
- model.safetensors +3 -0
- modules.json +14 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +51 -0
- tokenizer.json +0 -0
- tokenizer_config.json +66 -0
- vocab.txt +0 -0
1_Pooling/config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"word_embedding_dimension": 768,
|
3 |
+
"pooling_mode_cls_token": false,
|
4 |
+
"pooling_mode_mean_tokens": true,
|
5 |
+
"pooling_mode_max_tokens": false,
|
6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
7 |
+
"pooling_mode_weightedmean_tokens": false,
|
8 |
+
"pooling_mode_lasttoken": false,
|
9 |
+
"include_prompt": true
|
10 |
+
}
|
README.md
ADDED
@@ -0,0 +1,636 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
language:
|
3 |
+
- en
|
4 |
+
license: apache-2.0
|
5 |
+
tags:
|
6 |
+
- sentence-transformers
|
7 |
+
- sentence-similarity
|
8 |
+
- feature-extraction
|
9 |
+
- generated_from_trainer
|
10 |
+
- dataset_size:6433
|
11 |
+
- loss:Infonce
|
12 |
+
base_model: microsoft/mpnet-base
|
13 |
+
widget:
|
14 |
+
- source_sentence: What surprised the author about the appearance of sloths when looking
|
15 |
+
for animals to draw for the letter S
|
16 |
+
sentences:
|
17 |
+
- "Third National Bank may refer to:\n\nin the United States\n(by state)\nThird\
|
18 |
+
\ National Bank (Atlanta, Georgia), now The Metropolitan (Atlanta condominium\
|
19 |
+
\ building)\n Third National Bank (Glasgow, Kentucky), listed on the NRHP in Kentucky\n\
|
20 |
+
\ Third National Bank (Ohio), a predecessor of Fifth Third Bank\n Third National\
|
21 |
+
\ Bank (Syracuse, New York), listed on the NRHP in New York\n Third National Bank\
|
22 |
+
\ (Sandusky, Ohio), listed on the NRHP in Ohio\n Third National Bank in Nashville,\
|
23 |
+
\ now incorporated within SunTrust Bank"
|
24 |
+
- 'S is for Sloth
|
25 |
+
|
26 |
+
I never really paid much attention to sloths until I began searching for animals
|
27 |
+
to draw for the letter S. Looking at some photos, I was shocked to see just how
|
28 |
+
much they look like Muppets in real life! They''re hilarious!'
|
29 |
+
- 'History
|
30 |
+
|
31 |
+
The Annual Review of Animal Biosciences was first published in 2013, with Harris
|
32 |
+
A. Lewin and R. Michael Roberts as the founding co-editors. Though it was initially
|
33 |
+
published in print, as of 2021 it is only published electronically. Scope and
|
34 |
+
indexing
|
35 |
+
|
36 |
+
The Annual Review of Animal Biosciences defines its scope as covering significant
|
37 |
+
developments relevant to biotechnology, genomics, genetics, veterinary medicine,
|
38 |
+
animal breeding, and conservation biology. The intended audience for the journal
|
39 |
+
is scientists and veterinarians involved with wild and domestic animals. It is
|
40 |
+
abstracted and indexed in Scopus, Science Citation Index Expanded, MEDLINE, and
|
41 |
+
Embase, among others.'
|
42 |
+
- source_sentence: What distinguished the roles of different prisoners, such as the
|
43 |
+
functionaries and the Sonderkommando, in the Auschwitz camps
|
44 |
+
sentences:
|
45 |
+
- "Michael Matthews is a South African writer, producer and director. In 2017, he\
|
46 |
+
\ directed Five Fingers for Marseilles, a film that won best film category at\
|
47 |
+
\ 14th Africa Movie Academy Awards. Early life\nMatthews was born in Durban. He\
|
48 |
+
\ studied filmmaking at the CityVarsity Cape Town campus. Career \nMatthews is\
|
49 |
+
\ the director of Five Fingers for Marseilles, a film dubbed as South African\
|
50 |
+
\ first western film."
|
51 |
+
- Warsame and Ahmed M. Hassan, who was elected to the Clarkston, Georgia City Council
|
52 |
+
on the same day, are the first Somali Americans to be elected to municipal offices
|
53 |
+
in the United States and were the highest elected Somali Americans in the country
|
54 |
+
at the time. Warsame's election set civic precedence in the Somali American community
|
55 |
+
of Minneapolis, in which his campaign energized and mobilized this sub-community's
|
56 |
+
powerful voting bloc.
|
57 |
+
- 'Designated as Aussenlager (external camp), Nebenlager (extension camp), Arbeitslager
|
58 |
+
(labor camp), or Aussenkommando (external work detail), camps were built at Blechhammer,
|
59 |
+
Jawiszowice, Jaworzno, Lagisze, Mysłowice, Trzebinia, and as far afield as the
|
60 |
+
Protectorate of Bohemia and Moravia in Czechoslovakia. Industries with satellite
|
61 |
+
camps included coal mines, foundries and other metal works, and chemical plants.
|
62 |
+
Prisoners were also made to work in forestry and farming. For example, Wirtschaftshof
|
63 |
+
Budy, in the Polish village of Budy near Brzeszcze, was a farming subcamp where
|
64 |
+
prisoners worked 12-hour days in the fields, tending animals, and making compost
|
65 |
+
by mixing human ashes from the crematoria with sod and manure. Incidents of sabotage
|
66 |
+
to decrease production took place in several subcamps, including Charlottengrube,
|
67 |
+
Gleiwitz II, and Rajsko. Living conditions in some of the camps were so poor that
|
68 |
+
they were regarded as punishment subcamps. Life in the camps
|
69 |
+
|
70 |
+
|
71 |
+
SS garrison
|
72 |
+
|
73 |
+
|
74 |
+
Rudolf Höss, born in Baden-Baden in 1900, was named the first commandant of Auschwitz
|
75 |
+
when Heinrich Himmler ordered on 27 April 1940 that the camp be established. Living
|
76 |
+
with his wife and children in a two-story stucco house near the commandant''s
|
77 |
+
and administration building, he served as commandant until 11 November 1943, with
|
78 |
+
Josef Kramer as his deputy. Succeeded as commandant by Arthur Liebehenschel, Höss
|
79 |
+
joined the SS Business and Administration Head Office in Oranienburg as director
|
80 |
+
of Amt DI, a post that made him deputy of the camps inspectorate. Richard Baer
|
81 |
+
became commandant of Auschwitz I on 11 May 1944 and Fritz Hartjenstein of Auschwitz
|
82 |
+
II from 22 November 1943, followed by Josef Kramer from 15 May 1944 until the
|
83 |
+
camp''s liquidation in January 1945. Heinrich Schwarz was commandant of Auschwitz
|
84 |
+
III from the point at which it became an autonomous camp in November 1943 until
|
85 |
+
its liquidation. Höss returned to Auschwitz between 8 May and 29 July 1944 as
|
86 |
+
the local SS garrison commander (Standortältester) to oversee the arrival of Hungary''s
|
87 |
+
Jews, which made him the superior officer of all the commandants of the Auschwitz
|
88 |
+
camps. According to Aleksander Lasik, about 6,335 people (6,161 of them men) worked
|
89 |
+
for the SS at Auschwitz over the course of the camp''s existence; 4.2 percent
|
90 |
+
were officers, 26.1 percent non-commissioned officers, and 69.7 percent rank and
|
91 |
+
file. In March 1941, there were 700 SS guards; in June 1942, 2,000; and in August
|
92 |
+
1944, 3,342. At its peak in January 1945, 4,480 SS men and 71 SS women worked
|
93 |
+
in Auschwitz; the higher number is probably attributable to the logistics of evacuating
|
94 |
+
the camp. Female guards were known as SS supervisors (SS-Aufseherinnen). Most
|
95 |
+
of the staff were from Germany or Austria, but as the war progressed, increasing
|
96 |
+
numbers of Volksdeutsche from other countries, including Czechoslovakia, Poland,
|
97 |
+
Yugoslavia, and the Baltic states, joined the SS at Auschwitz. Not all were ethnically
|
98 |
+
German. Guards were also recruited from Hungary, Romania, and Slovakia. Camp guards,
|
99 |
+
around three quarters of the SS personnel, were members of the SS-Totenkopfverbände
|
100 |
+
(death''s head units). Other SS staff worked in the medical or political departments,
|
101 |
+
or in the economic administration, which was responsible for clothing and other
|
102 |
+
supplies, including the property of dead prisoners. The SS viewed Auschwitz as
|
103 |
+
a comfortable posting; being there meant they had avoided the front and had access
|
104 |
+
to the victims'' property. Functionaries and Sonderkommando
|
105 |
+
|
106 |
+
|
107 |
+
Certain prisoners, at first non-Jewish Germans but later Jews and non-Jewish Poles,
|
108 |
+
were assigned positions of authority as Funktionshäftlinge (functionaries), which
|
109 |
+
gave them access to better housing and food. The Lagerprominenz (camp elite) included
|
110 |
+
Blockschreiber (barracks clerk), Kapo (overseer), Stubendienst (barracks orderly),
|
111 |
+
and Kommandierte (trusties). Wielding tremendous power over other prisoners, the
|
112 |
+
functionaries developed a reputation as sadists. Very few were prosecuted after
|
113 |
+
the war, because of the difficulty of determining which atrocities had been performed
|
114 |
+
by order of the SS. Although the SS oversaw the murders at each gas chamber, the
|
115 |
+
forced labor portion of the work was done by prisoners known from 1942 as the
|
116 |
+
Sonderkommando (special squad). These were mostly Jews but they included groups
|
117 |
+
such as Soviet POWs. In 1940–1941 when there was one gas chamber, there were 20
|
118 |
+
such prisoners, in late 1943 there were 400, and by 1944 during the Holocaust
|
119 |
+
in Hungary the number had risen to 874. The Sonderkommando removed goods and corpses
|
120 |
+
from the incoming trains, guided victims to the dressing rooms and gas chambers,
|
121 |
+
removed their bodies afterwards, and took their jewelry, hair, dental work, and
|
122 |
+
any precious metals from their teeth, all of which was sent to Germany. Once the
|
123 |
+
bodies were stripped of anything valuable, the Sonderkommando burned them in the
|
124 |
+
crematoria. Because they were witnesses to the mass murder, the Sonderkommando
|
125 |
+
lived separately from the other prisoners, although this rule was not applied
|
126 |
+
to the non-Jews among them. Their quality of life was further improved by their
|
127 |
+
access to the property of new arrivals, which they traded within the camp, including
|
128 |
+
with the SS. Nevertheless, their life expectancy was short; they were regularly
|
129 |
+
murdered and replaced. About 100 survived to the camp''s liquidation. They were
|
130 |
+
forced on a death march and by train to the camp at Mauthausen, where three days
|
131 |
+
later they were asked to step forward during roll call. No one did, and because
|
132 |
+
the SS did not have their records, several of them survived. Tattoos and triangles
|
133 |
+
|
134 |
+
|
135 |
+
Uniquely at Auschwitz, prisoners were tattooed with a serial number, on their
|
136 |
+
left breast for Soviet prisoners of war and on the left arm for civilians. Categories
|
137 |
+
of prisoner were distinguishable by triangular pieces of cloth (German: Winkel)
|
138 |
+
sewn onto on their jackets below their prisoner number. Political prisoners (Schutzhäftlinge
|
139 |
+
or Sch), mostly Poles, had a red triangle, while criminals (Berufsverbrecher or
|
140 |
+
BV) were mostly German and wore green. Asocial prisoners (Asoziale or Aso), which
|
141 |
+
included vagrants, prostitutes and the Roma, wore black. Purple was for Jehovah''s
|
142 |
+
Witnesses (Internationale Bibelforscher-Vereinigung or IBV)''s and pink for gay
|
143 |
+
men, who were mostly German. An estimated 5,000–15,000 gay men prosecuted under
|
144 |
+
German Penal Code Section 175 (proscribing sexual acts between men) were detained
|
145 |
+
in concentration camps, of whom an unknown number were sent to Auschwitz. Jews
|
146 |
+
wore a yellow badge, the shape of the Star of David, overlaid by a second triangle
|
147 |
+
if they also belonged to a second category. The nationality of the inmate was
|
148 |
+
indicated by a letter stitched onto the cloth. A racial hierarchy existed, with
|
149 |
+
German prisoners at the top. Next were non-Jewish prisoners from other countries.
|
150 |
+
Jewish prisoners were at the bottom. Transports
|
151 |
+
|
152 |
+
|
153 |
+
Deportees were brought to Auschwitz crammed in wretched conditions into goods
|
154 |
+
or cattle wagons, arriving near a railway station or at one of several dedicated
|
155 |
+
trackside ramps, including one next to Auschwitz I. The Altejudenrampe (old Jewish
|
156 |
+
ramp), part of the Oświęcim freight railway station, was used from 1942 to 1944
|
157 |
+
for Jewish transports. Located between Auschwitz I and Auschwitz II, arriving
|
158 |
+
at this ramp meant a 2.5 km journey to Auschwitz II and the gas chambers. Most
|
159 |
+
deportees were forced to walk, accompanied by SS men and a car with a Red Cross
|
160 |
+
symbol that carried the Zyklon B, as well as an SS doctor in case officers were
|
161 |
+
poisoned by mistake. Inmates arriving at night, or who were too weak to walk,
|
162 |
+
were taken by truck. Work on a new railway line and ramp (right) between sectors
|
163 |
+
BI and BII in Auschwitz II, was completed in May 1944 for the arrival of Hungarian
|
164 |
+
Jews between May and early July 1944. The rails led directly to the area around
|
165 |
+
the gas chambers. Life for the inmates
|
166 |
+
|
167 |
+
The day began at 4:30 am for the men (an hour later in winter), and earlier for
|
168 |
+
the women, when the block supervis'
|
169 |
+
- source_sentence: Do restaurants like Chick-fil-A have signs indicating restrictions
|
170 |
+
against LGBTQ+ individuals
|
171 |
+
sentences:
|
172 |
+
- 'Restaurants have signs like "no smoking," "no guns," "no shoes, no service,"
|
173 |
+
but never have I seen a restaurant, especially Chick-fil-A, say "no gays or lesbians."
|
174 |
+
Get on the ball
|
175 |
+
|
176 |
+
In the newspaper this past week, "St. Charles seeks input on mall," how many more
|
177 |
+
studies are they going to do'
|
178 |
+
- His excavations lead to him being convinced that this site was more than likely
|
179 |
+
a pre-ceramic age and decided to discover it further. Later Voorhies worked to
|
180 |
+
understand and evaluate the Chantuto sites and the people who inhabited this area.
|
181 |
+
- Gross domestic product (GDP) is the market value of all final goods and services
|
182 |
+
from a nation in a given year.
|
183 |
+
- source_sentence: How can Vaseline be used to help with chapped lips
|
184 |
+
sentences:
|
185 |
+
- '4. Soothe Chapped Lips
|
186 |
+
|
187 |
+
So, you probably already knew Vaseline made a great lip balm, but it can also
|
188 |
+
be used as a base in many lip scrubs, which will really come in handy during the
|
189 |
+
winter months. 5.'
|
190 |
+
- Retrieved March 30, 2005 from . Healthcare Information and Management Systems
|
191 |
+
Society (HIMSS) (2005, February).
|
192 |
+
- The Government of Zimbabwe strongly believes in the independence of the judiciary
|
193 |
+
and respects the principles of the separation of powers as set out in the Constitution
|
194 |
+
of Zimbabwe. The Government of Zimbabwe, therefore, recognises the importance
|
195 |
+
of the judiciary as a dependable interpreter of the law where various opinions
|
196 |
+
may arise.
|
197 |
+
- source_sentence: What challenges do university researchers face when trying to turn
|
198 |
+
their discoveries into commercial products
|
199 |
+
sentences:
|
200 |
+
- 'A major shakeup has taken place at the top of the Boston Celtics. Danny Ainge
|
201 |
+
has stepped down as president of basketball operations, and head coach Brad Stevens
|
202 |
+
has stepped into the role. Stevens will now lead the search for a new coach. The
|
203 |
+
team made the announcement early Wednesday, one day after the Celtics were eliminated
|
204 |
+
by the Brooklyn Nets in the first round of the Eastern Conference playoffs. “Helping
|
205 |
+
guide this organization has been the thrill of a lifetime, and having worked side-by-side
|
206 |
+
with him since he’s been here, I know we couldn’t be in better hands than with
|
207 |
+
Brad guiding the team going forward,” Ainge said in a statement. “I’m grateful
|
208 |
+
to ownership, all of my Celtics colleagues, and the best fans in basketball for
|
209 |
+
being part of the journey.”
|
210 |
+
|
211 |
+
Ainge, 62, is a franchise legend.'
|
212 |
+
- 'Alfred William Lawson (March 24, 1869 – November 29, 1954) was an English born
|
213 |
+
professional baseball player, aviator and utopian philosopher. He was a baseball
|
214 |
+
player, manager, and league promoter from 1887 through 1916 and went on to play
|
215 |
+
a pioneering role in the U.S. aircraft industry. He published two early aviation
|
216 |
+
trade journals. He is frequently cited as the inventor of the airliner and was
|
217 |
+
awarded several of the first air mail contracts, which he ultimately could not
|
218 |
+
fulfill. He founded the Lawson Aircraft Company in Green Bay, Wisconsin, to build
|
219 |
+
military training aircraft and later the Lawson Airplane Company in South Milwaukee,
|
220 |
+
Wisconsin, to build airliners. The crash of his ambitious Lawson L-4 "Midnight
|
221 |
+
Liner" during its trial flight takeoff on May 8, 1921, ended his best chance
|
222 |
+
for commercial aviation success. In 1904, he wrote a utopian novel, Born Again,
|
223 |
+
in which he developed the philosophy which later became Lawsonomy. Baseball career
|
224 |
+
(1888–1907)
|
225 |
+
|
226 |
+
|
227 |
+
He made one start for the Boston Beaneaters and two for the Pittsburgh Alleghenys
|
228 |
+
during the 1890 season. His minor league playing career lasted through 1895. He
|
229 |
+
later managed in the minors from 1905 to 1907. Union Professional League
|
230 |
+
|
231 |
+
In 1908, he started a new professional baseball league known as the Union Professional
|
232 |
+
League. The league took the field in April but folded one month later owing to
|
233 |
+
financial difficulties. Aviation career (1908–1928)
|
234 |
+
|
235 |
+
An early advocate or rather evangelist of aviation, in October 1908 Lawson started
|
236 |
+
the magazine Fly to stimulate public interest and educate readers in the fundamentals
|
237 |
+
of the new science of aviation. It sold for 10 cents a copy from newsstands across
|
238 |
+
the country. In 1910, moving to New York City, he renamed the magazine Aircraft
|
239 |
+
and published it until 1914. The magazine chronicled the technical developments
|
240 |
+
of the early aviation pioneers. Lawson was the first advocate for commercial air
|
241 |
+
travel, coining the term "airline." He also advocated for a strong American flying
|
242 |
+
force, lobbying Congress in 1913 to expand its appropriations for Army aircraft.
|
243 |
+
In early 1913, he learned to fly the Sloan-Deperdussin and the Moisant-Bleriot
|
244 |
+
monoplanes, becoming an accomplished pilot. Later that year he bought a Thomas
|
245 |
+
flying boat and became the first air commuter regularly flying from his country
|
246 |
+
house in Seidler''s Beach, New Jersey, to the foot of 75th Street in New York
|
247 |
+
City (about 35 miles). In 1917, utilizing the knowledge gained from ten years
|
248 |
+
of advocating aviation, he built his first airplane, the Lawson Military Tractor
|
249 |
+
1 (MT-1) trainer, and founded the Lawson Aircraft Corporation. The company''s
|
250 |
+
plant was sited at Green Bay, Wisconsin. There he secured a contract and built
|
251 |
+
the Lawson MT-2. He also designed the steel fuselage Lawson Armored Battler, which
|
252 |
+
never got beyond the drafting board, given doubts within the Army aviation community
|
253 |
+
and the signing of the armistice. After the war, in 1919 Lawson started a project
|
254 |
+
to build America''s first airline. He secured financial backing, and in five months
|
255 |
+
he had built and demonstrated in flight his biplane airliner, the 18-passenger
|
256 |
+
Lawson L-2. He demonstrated its capabilities in a 2000-mile multi-city tour from
|
257 |
+
Milwaukee to Chicago-Toledo-Cleveland-Buffalo-Syracuse-New york City-Washington,
|
258 |
+
D.C.-Collinsville-Dayton-Chicago and back to Milwaukee, creating a buzz of positive
|
259 |
+
press. The publicity allowed him to secure an additional $1 million to build the
|
260 |
+
26-passenger Midnight Liner. The aircraft crashed on takeoff on its maiden flight.
|
261 |
+
In late 1920, he secured government contracts for three airmail routes and to
|
262 |
+
deliver ten war planes, but owing to the fall 1920 recession, he could not secure
|
263 |
+
the necessary $100,000 in cash reserves called for in the contracts and had to
|
264 |
+
decline them.'
|
265 |
+
- 'Universities are vital to the process of innovation and advancement: they educate
|
266 |
+
students who bring new ways of thinking to old problems, and they make new discoveries
|
267 |
+
that no one else would make because no one else has the opportunity to delve so
|
268 |
+
deeply. In creating this type of refuge, we also create a comfort zone. Because
|
269 |
+
governmental support for science and technology is designed to support long-term,
|
270 |
+
high-risk work regardless of immediate return, ROI is not a factor in getting
|
271 |
+
government funding. University researchers become successful at pitching research
|
272 |
+
ideas without serious reference to commercial outcome. Peer review – which is
|
273 |
+
critical for the success of science – further reinforces this tendency. University
|
274 |
+
researchers are rewarded for thinking in this very specific way, and this creates
|
275 |
+
the comfort zone. As it dawns on a researcher that they may need to work with
|
276 |
+
a company or an entrepreneur to see their discoveries become products or services
|
277 |
+
that can benefit society, they may find themselves a victim of their own past
|
278 |
+
success. Many researchers reflexively approach companies as if they are yet another
|
279 |
+
type of funding agency, but since companies are not in the grant-making business,
|
280 |
+
a partnership fails to materialize. This basic failure to communicate means valuable
|
281 |
+
commercial opportunities are often not recognized, or when they are, the resulting
|
282 |
+
partnership does not go well.'
|
283 |
+
pipeline_tag: sentence-similarity
|
284 |
+
library_name: sentence-transformers
|
285 |
+
---
|
286 |
+
|
287 |
+
# MPNet base trained on AllNLI triplets
|
288 |
+
|
289 |
+
This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [microsoft/mpnet-base](https://huggingface.co/microsoft/mpnet-base). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
290 |
+
|
291 |
+
## Model Details
|
292 |
+
|
293 |
+
### Model Description
|
294 |
+
- **Model Type:** Sentence Transformer
|
295 |
+
- **Base model:** [microsoft/mpnet-base](https://huggingface.co/microsoft/mpnet-base) <!-- at revision 6996ce1e91bd2a9c7d7f61daec37463394f73f09 -->
|
296 |
+
- **Maximum Sequence Length:** 512 tokens
|
297 |
+
- **Output Dimensionality:** 768 dimensions
|
298 |
+
- **Similarity Function:** Cosine Similarity
|
299 |
+
<!-- - **Training Dataset:** Unknown -->
|
300 |
+
- **Language:** en
|
301 |
+
- **License:** apache-2.0
|
302 |
+
|
303 |
+
### Model Sources
|
304 |
+
|
305 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
306 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
307 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
308 |
+
|
309 |
+
### Full Model Architecture
|
310 |
+
|
311 |
+
```
|
312 |
+
SentenceTransformer(
|
313 |
+
(0): Transformer({'max_seq_length': 512, 'do_lower_case': False}) with Transformer model: MPNetModel
|
314 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
315 |
+
)
|
316 |
+
```
|
317 |
+
|
318 |
+
## Usage
|
319 |
+
|
320 |
+
### Direct Usage (Sentence Transformers)
|
321 |
+
|
322 |
+
First install the Sentence Transformers library:
|
323 |
+
|
324 |
+
```bash
|
325 |
+
pip install -U sentence-transformers
|
326 |
+
```
|
327 |
+
|
328 |
+
Then you can load this model and run inference.
|
329 |
+
```python
|
330 |
+
from sentence_transformers import SentenceTransformer
|
331 |
+
|
332 |
+
# Download from the 🤗 Hub
|
333 |
+
model = SentenceTransformer("Jrinky/mpnet-base-all-nli-triplet")
|
334 |
+
# Run inference
|
335 |
+
sentences = [
|
336 |
+
'What challenges do university researchers face when trying to turn their discoveries into commercial products',
|
337 |
+
'Universities are vital to the process of innovation and advancement: they educate students who bring new ways of thinking to old problems, and they make new discoveries that no one else would make because no one else has the opportunity to delve so deeply. In creating this type of refuge, we also create a comfort zone. Because governmental support for science and technology is designed to support long-term, high-risk work regardless of immediate return, ROI is not a factor in getting government funding. University researchers become successful at pitching research ideas without serious reference to commercial outcome. Peer review – which is critical for the success of science – further reinforces this tendency. University researchers are rewarded for thinking in this very specific way, and this creates the comfort zone. As it dawns on a researcher that they may need to work with a company or an entrepreneur to see their discoveries become products or services that can benefit society, they may find themselves a victim of their own past success. Many researchers reflexively approach companies as if they are yet another type of funding agency, but since companies are not in the grant-making business, a partnership fails to materialize. This basic failure to communicate means valuable commercial opportunities are often not recognized, or when they are, the resulting partnership does not go well.',
|
338 |
+
'A major shakeup has taken place at the top of the Boston Celtics. Danny Ainge has stepped down as president of basketball operations, and head coach Brad Stevens has stepped into the role. Stevens will now lead the search for a new coach. The team made the announcement early Wednesday, one day after the Celtics were eliminated by the Brooklyn Nets in the first round of the Eastern Conference playoffs. “Helping guide this organization has been the thrill of a lifetime, and having worked side-by-side with him since he’s been here, I know we couldn’t be in better hands than with Brad guiding the team going forward,” Ainge said in a statement. “I’m grateful to ownership, all of my Celtics colleagues, and the best fans in basketball for being part of the journey.”\nAinge, 62, is a franchise legend.',
|
339 |
+
]
|
340 |
+
embeddings = model.encode(sentences)
|
341 |
+
print(embeddings.shape)
|
342 |
+
# [3, 768]
|
343 |
+
|
344 |
+
# Get the similarity scores for the embeddings
|
345 |
+
similarities = model.similarity(embeddings, embeddings)
|
346 |
+
print(similarities.shape)
|
347 |
+
# [3, 3]
|
348 |
+
```
|
349 |
+
|
350 |
+
<!--
|
351 |
+
### Direct Usage (Transformers)
|
352 |
+
|
353 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
354 |
+
|
355 |
+
</details>
|
356 |
+
-->
|
357 |
+
|
358 |
+
<!--
|
359 |
+
### Downstream Usage (Sentence Transformers)
|
360 |
+
|
361 |
+
You can finetune this model on your own dataset.
|
362 |
+
|
363 |
+
<details><summary>Click to expand</summary>
|
364 |
+
|
365 |
+
</details>
|
366 |
+
-->
|
367 |
+
|
368 |
+
<!--
|
369 |
+
### Out-of-Scope Use
|
370 |
+
|
371 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
372 |
+
-->
|
373 |
+
|
374 |
+
<!--
|
375 |
+
## Bias, Risks and Limitations
|
376 |
+
|
377 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
378 |
+
-->
|
379 |
+
|
380 |
+
<!--
|
381 |
+
### Recommendations
|
382 |
+
|
383 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
384 |
+
-->
|
385 |
+
|
386 |
+
## Training Details
|
387 |
+
|
388 |
+
### Training Dataset
|
389 |
+
|
390 |
+
#### Unnamed Dataset
|
391 |
+
|
392 |
+
* Size: 6,433 training samples
|
393 |
+
* Columns: <code>anchor</code> and <code>positive</code>
|
394 |
+
* Approximate statistics based on the first 1000 samples:
|
395 |
+
| | anchor | positive |
|
396 |
+
|:--------|:----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|
|
397 |
+
| type | string | string |
|
398 |
+
| details | <ul><li>min: 6 tokens</li><li>mean: 16.21 tokens</li><li>max: 42 tokens</li></ul> | <ul><li>min: 5 tokens</li><li>mean: 140.69 tokens</li><li>max: 512 tokens</li></ul> |
|
399 |
+
* Samples:
|
400 |
+
| anchor | positive |
|
401 |
+
|:--------------------------------------------------------------------------------------------------------------------------------|:------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
402 |
+
| <code>What type of event is being described by Pierre LeBrun in relation to the NHL</code> | <code>ESPN’s Pierre LeBrun said, “It's not just about one NHL game anymore. It's a week-long event.</code> |
|
403 |
+
| <code>Who designed the property's landscape and when was the building listed on the National Register of Historic Places</code> | <code>The property's landscape continues a circular theme, with flower beds, fencing, and parking arranged in concentric patterns around the structure. It was designed by the Washington, DC firm of Deigert & Yerkes. The building was listed on the National Register of Historic Places in 2017.</code> |
|
404 |
+
| <code>Is 'ladens' a valid word to use in Scrabble and other word games</code> | <code>Scrabble?! LADENSIs ladens valid for Scrabble? Words With Friends? Lexulous? WordFeud? Other games</code> |
|
405 |
+
* Loss: <code>selfloss.Infonce</code> with these parameters:
|
406 |
+
```json
|
407 |
+
{
|
408 |
+
"scale": 20.0,
|
409 |
+
"similarity_fct": "cos_sim"
|
410 |
+
}
|
411 |
+
```
|
412 |
+
|
413 |
+
### Evaluation Dataset
|
414 |
+
|
415 |
+
#### Unnamed Dataset
|
416 |
+
|
417 |
+
* Size: 804 evaluation samples
|
418 |
+
* Columns: <code>anchor</code> and <code>positive</code>
|
419 |
+
* Approximate statistics based on the first 804 samples:
|
420 |
+
| | anchor | positive |
|
421 |
+
|:--------|:----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|
|
422 |
+
| type | string | string |
|
423 |
+
| details | <ul><li>min: 7 tokens</li><li>mean: 16.44 tokens</li><li>max: 38 tokens</li></ul> | <ul><li>min: 8 tokens</li><li>mean: 149.21 tokens</li><li>max: 512 tokens</li></ul> |
|
424 |
+
* Samples:
|
425 |
+
| anchor | positive |
|
426 |
+
|:-------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
427 |
+
| <code>What types of special events can the salon services be booked for</code> | <code>Our fabulous salon services are available at your special event! Whether it's a wedding, photo shoot, prom, or just a fun girls' night in- we do it all.</code> |
|
428 |
+
| <code>What material is the Hudson Baby plush hooded robe made of</code> | <code>Dimensions (Overall): 10 inches (L), 10 inches (H) x 1 inches (W)<br>Weight: 1 pounds<br>Textile Material: 100% Polyester<br>• Animal face plush hooded bath robe. • Made with 100% plush coral fleece fabric<br>• Soft and gentle on baby's skin<br>• Optimal for everyday use<br>• Affordable, high quality bath robe<br>Hudson Baby plush hooded robe is made of super soft, cozy plush material to dry and warm baby after bath or pool time.</code> |
|
429 |
+
| <code>Where is this uncommon species thought to occur</code> | <code>It is also thought to occur in New Zealand. It is an uncommon species, growing in "heathy woodland [in] semi shade".</code> |
|
430 |
+
* Loss: <code>selfloss.Infonce</code> with these parameters:
|
431 |
+
```json
|
432 |
+
{
|
433 |
+
"scale": 20.0,
|
434 |
+
"similarity_fct": "cos_sim"
|
435 |
+
}
|
436 |
+
```
|
437 |
+
|
438 |
+
### Training Hyperparameters
|
439 |
+
#### Non-Default Hyperparameters
|
440 |
+
|
441 |
+
- `eval_strategy`: steps
|
442 |
+
- `per_device_train_batch_size`: 32
|
443 |
+
- `per_device_eval_batch_size`: 32
|
444 |
+
- `learning_rate`: 2e-05
|
445 |
+
- `num_train_epochs`: 6
|
446 |
+
- `warmup_ratio`: 0.1
|
447 |
+
- `fp16`: True
|
448 |
+
- `batch_sampler`: no_duplicates
|
449 |
+
|
450 |
+
#### All Hyperparameters
|
451 |
+
<details><summary>Click to expand</summary>
|
452 |
+
|
453 |
+
- `overwrite_output_dir`: False
|
454 |
+
- `do_predict`: False
|
455 |
+
- `eval_strategy`: steps
|
456 |
+
- `prediction_loss_only`: True
|
457 |
+
- `per_device_train_batch_size`: 32
|
458 |
+
- `per_device_eval_batch_size`: 32
|
459 |
+
- `per_gpu_train_batch_size`: None
|
460 |
+
- `per_gpu_eval_batch_size`: None
|
461 |
+
- `gradient_accumulation_steps`: 1
|
462 |
+
- `eval_accumulation_steps`: None
|
463 |
+
- `torch_empty_cache_steps`: None
|
464 |
+
- `learning_rate`: 2e-05
|
465 |
+
- `weight_decay`: 0.0
|
466 |
+
- `adam_beta1`: 0.9
|
467 |
+
- `adam_beta2`: 0.999
|
468 |
+
- `adam_epsilon`: 1e-08
|
469 |
+
- `max_grad_norm`: 1.0
|
470 |
+
- `num_train_epochs`: 6
|
471 |
+
- `max_steps`: -1
|
472 |
+
- `lr_scheduler_type`: linear
|
473 |
+
- `lr_scheduler_kwargs`: {}
|
474 |
+
- `warmup_ratio`: 0.1
|
475 |
+
- `warmup_steps`: 0
|
476 |
+
- `log_level`: passive
|
477 |
+
- `log_level_replica`: warning
|
478 |
+
- `log_on_each_node`: True
|
479 |
+
- `logging_nan_inf_filter`: True
|
480 |
+
- `save_safetensors`: True
|
481 |
+
- `save_on_each_node`: False
|
482 |
+
- `save_only_model`: False
|
483 |
+
- `restore_callback_states_from_checkpoint`: False
|
484 |
+
- `no_cuda`: False
|
485 |
+
- `use_cpu`: False
|
486 |
+
- `use_mps_device`: False
|
487 |
+
- `seed`: 42
|
488 |
+
- `data_seed`: None
|
489 |
+
- `jit_mode_eval`: False
|
490 |
+
- `use_ipex`: False
|
491 |
+
- `bf16`: False
|
492 |
+
- `fp16`: True
|
493 |
+
- `fp16_opt_level`: O1
|
494 |
+
- `half_precision_backend`: auto
|
495 |
+
- `bf16_full_eval`: False
|
496 |
+
- `fp16_full_eval`: False
|
497 |
+
- `tf32`: None
|
498 |
+
- `local_rank`: 0
|
499 |
+
- `ddp_backend`: None
|
500 |
+
- `tpu_num_cores`: None
|
501 |
+
- `tpu_metrics_debug`: False
|
502 |
+
- `debug`: []
|
503 |
+
- `dataloader_drop_last`: False
|
504 |
+
- `dataloader_num_workers`: 0
|
505 |
+
- `dataloader_prefetch_factor`: None
|
506 |
+
- `past_index`: -1
|
507 |
+
- `disable_tqdm`: False
|
508 |
+
- `remove_unused_columns`: True
|
509 |
+
- `label_names`: None
|
510 |
+
- `load_best_model_at_end`: False
|
511 |
+
- `ignore_data_skip`: False
|
512 |
+
- `fsdp`: []
|
513 |
+
- `fsdp_min_num_params`: 0
|
514 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
515 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
516 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
517 |
+
- `deepspeed`: None
|
518 |
+
- `label_smoothing_factor`: 0.0
|
519 |
+
- `optim`: adamw_torch
|
520 |
+
- `optim_args`: None
|
521 |
+
- `adafactor`: False
|
522 |
+
- `group_by_length`: False
|
523 |
+
- `length_column_name`: length
|
524 |
+
- `ddp_find_unused_parameters`: None
|
525 |
+
- `ddp_bucket_cap_mb`: None
|
526 |
+
- `ddp_broadcast_buffers`: False
|
527 |
+
- `dataloader_pin_memory`: True
|
528 |
+
- `dataloader_persistent_workers`: False
|
529 |
+
- `skip_memory_metrics`: True
|
530 |
+
- `use_legacy_prediction_loop`: False
|
531 |
+
- `push_to_hub`: False
|
532 |
+
- `resume_from_checkpoint`: None
|
533 |
+
- `hub_model_id`: None
|
534 |
+
- `hub_strategy`: every_save
|
535 |
+
- `hub_private_repo`: None
|
536 |
+
- `hub_always_push`: False
|
537 |
+
- `gradient_checkpointing`: False
|
538 |
+
- `gradient_checkpointing_kwargs`: None
|
539 |
+
- `include_inputs_for_metrics`: False
|
540 |
+
- `include_for_metrics`: []
|
541 |
+
- `eval_do_concat_batches`: True
|
542 |
+
- `fp16_backend`: auto
|
543 |
+
- `push_to_hub_model_id`: None
|
544 |
+
- `push_to_hub_organization`: None
|
545 |
+
- `mp_parameters`:
|
546 |
+
- `auto_find_batch_size`: False
|
547 |
+
- `full_determinism`: False
|
548 |
+
- `torchdynamo`: None
|
549 |
+
- `ray_scope`: last
|
550 |
+
- `ddp_timeout`: 1800
|
551 |
+
- `torch_compile`: False
|
552 |
+
- `torch_compile_backend`: None
|
553 |
+
- `torch_compile_mode`: None
|
554 |
+
- `dispatch_batches`: None
|
555 |
+
- `split_batches`: None
|
556 |
+
- `include_tokens_per_second`: False
|
557 |
+
- `include_num_input_tokens_seen`: False
|
558 |
+
- `neftune_noise_alpha`: None
|
559 |
+
- `optim_target_modules`: None
|
560 |
+
- `batch_eval_metrics`: False
|
561 |
+
- `eval_on_start`: False
|
562 |
+
- `use_liger_kernel`: False
|
563 |
+
- `eval_use_gather_object`: False
|
564 |
+
- `average_tokens_across_devices`: False
|
565 |
+
- `prompts`: None
|
566 |
+
- `batch_sampler`: no_duplicates
|
567 |
+
- `multi_dataset_batch_sampler`: proportional
|
568 |
+
|
569 |
+
</details>
|
570 |
+
|
571 |
+
### Training Logs
|
572 |
+
| Epoch | Step | Training Loss | Validation Loss |
|
573 |
+
|:------:|:----:|:-------------:|:---------------:|
|
574 |
+
| 0.9901 | 100 | 1.4311 | 0.2171 |
|
575 |
+
| 1.9802 | 200 | 0.237 | 0.1718 |
|
576 |
+
| 2.9703 | 300 | 0.1466 | 0.1561 |
|
577 |
+
| 3.9604 | 400 | 0.1084 | 0.1541 |
|
578 |
+
| 4.9505 | 500 | 0.0879 | 0.1528 |
|
579 |
+
| 5.9406 | 600 | 0.0794 | 0.1514 |
|
580 |
+
|
581 |
+
|
582 |
+
### Framework Versions
|
583 |
+
- Python: 3.10.12
|
584 |
+
- Sentence Transformers: 3.4.0
|
585 |
+
- Transformers: 4.48.1
|
586 |
+
- PyTorch: 2.5.1+cu124
|
587 |
+
- Accelerate: 1.3.0
|
588 |
+
- Datasets: 3.2.0
|
589 |
+
- Tokenizers: 0.21.0
|
590 |
+
|
591 |
+
## Citation
|
592 |
+
|
593 |
+
### BibTeX
|
594 |
+
|
595 |
+
#### Sentence Transformers
|
596 |
+
```bibtex
|
597 |
+
@inproceedings{reimers-2019-sentence-bert,
|
598 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
599 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
600 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
601 |
+
month = "11",
|
602 |
+
year = "2019",
|
603 |
+
publisher = "Association for Computational Linguistics",
|
604 |
+
url = "https://arxiv.org/abs/1908.10084",
|
605 |
+
}
|
606 |
+
```
|
607 |
+
|
608 |
+
#### Infonce
|
609 |
+
```bibtex
|
610 |
+
@misc{henderson2017efficient,
|
611 |
+
title={Efficient Natural Language Response Suggestion for Smart Reply},
|
612 |
+
author={Matthew Henderson and Rami Al-Rfou and Brian Strope and Yun-hsuan Sung and Laszlo Lukacs and Ruiqi Guo and Sanjiv Kumar and Balint Miklos and Ray Kurzweil},
|
613 |
+
year={2017},
|
614 |
+
eprint={1705.00652},
|
615 |
+
archivePrefix={arXiv},
|
616 |
+
primaryClass={cs.CL}
|
617 |
+
}
|
618 |
+
```
|
619 |
+
|
620 |
+
<!--
|
621 |
+
## Glossary
|
622 |
+
|
623 |
+
*Clearly define terms in order to be accessible across audiences.*
|
624 |
+
-->
|
625 |
+
|
626 |
+
<!--
|
627 |
+
## Model Card Authors
|
628 |
+
|
629 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
630 |
+
-->
|
631 |
+
|
632 |
+
<!--
|
633 |
+
## Model Card Contact
|
634 |
+
|
635 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
636 |
+
-->
|
config.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "microsoft/mpnet-base",
|
3 |
+
"architectures": [
|
4 |
+
"MPNetModel"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"bos_token_id": 0,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"hidden_act": "gelu",
|
10 |
+
"hidden_dropout_prob": 0.1,
|
11 |
+
"hidden_size": 768,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 3072,
|
14 |
+
"layer_norm_eps": 1e-05,
|
15 |
+
"max_position_embeddings": 514,
|
16 |
+
"model_type": "mpnet",
|
17 |
+
"num_attention_heads": 12,
|
18 |
+
"num_hidden_layers": 12,
|
19 |
+
"pad_token_id": 1,
|
20 |
+
"relative_attention_num_buckets": 32,
|
21 |
+
"torch_dtype": "float32",
|
22 |
+
"transformers_version": "4.48.1",
|
23 |
+
"vocab_size": 30527
|
24 |
+
}
|
config_sentence_transformers.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"__version__": {
|
3 |
+
"sentence_transformers": "3.4.0",
|
4 |
+
"transformers": "4.48.1",
|
5 |
+
"pytorch": "2.5.1+cu124"
|
6 |
+
},
|
7 |
+
"prompts": {},
|
8 |
+
"default_prompt_name": null,
|
9 |
+
"similarity_fn_name": "cosine"
|
10 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81fec4167b7d016f1b784e1238cc5a091f315a1a18fcbde26126971fa0466e36
|
3 |
+
size 437967672
|
modules.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"idx": 0,
|
4 |
+
"name": "0",
|
5 |
+
"path": "",
|
6 |
+
"type": "sentence_transformers.models.Transformer"
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"idx": 1,
|
10 |
+
"name": "1",
|
11 |
+
"path": "1_Pooling",
|
12 |
+
"type": "sentence_transformers.models.Pooling"
|
13 |
+
}
|
14 |
+
]
|
sentence_bert_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"max_seq_length": 512,
|
3 |
+
"do_lower_case": false
|
4 |
+
}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"cls_token": {
|
10 |
+
"content": "<s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"eos_token": {
|
17 |
+
"content": "</s>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": false,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
},
|
23 |
+
"mask_token": {
|
24 |
+
"content": "<mask>",
|
25 |
+
"lstrip": true,
|
26 |
+
"normalized": false,
|
27 |
+
"rstrip": false,
|
28 |
+
"single_word": false
|
29 |
+
},
|
30 |
+
"pad_token": {
|
31 |
+
"content": "<pad>",
|
32 |
+
"lstrip": false,
|
33 |
+
"normalized": false,
|
34 |
+
"rstrip": false,
|
35 |
+
"single_word": false
|
36 |
+
},
|
37 |
+
"sep_token": {
|
38 |
+
"content": "</s>",
|
39 |
+
"lstrip": false,
|
40 |
+
"normalized": true,
|
41 |
+
"rstrip": false,
|
42 |
+
"single_word": false
|
43 |
+
},
|
44 |
+
"unk_token": {
|
45 |
+
"content": "[UNK]",
|
46 |
+
"lstrip": false,
|
47 |
+
"normalized": false,
|
48 |
+
"rstrip": false,
|
49 |
+
"single_word": false
|
50 |
+
}
|
51 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,66 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "<s>",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"1": {
|
12 |
+
"content": "<pad>",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"2": {
|
20 |
+
"content": "</s>",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"3": {
|
28 |
+
"content": "<unk>",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": true,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"104": {
|
36 |
+
"content": "[UNK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
},
|
43 |
+
"30526": {
|
44 |
+
"content": "<mask>",
|
45 |
+
"lstrip": true,
|
46 |
+
"normalized": false,
|
47 |
+
"rstrip": false,
|
48 |
+
"single_word": false,
|
49 |
+
"special": true
|
50 |
+
}
|
51 |
+
},
|
52 |
+
"bos_token": "<s>",
|
53 |
+
"clean_up_tokenization_spaces": false,
|
54 |
+
"cls_token": "<s>",
|
55 |
+
"do_lower_case": true,
|
56 |
+
"eos_token": "</s>",
|
57 |
+
"extra_special_tokens": {},
|
58 |
+
"mask_token": "<mask>",
|
59 |
+
"model_max_length": 512,
|
60 |
+
"pad_token": "<pad>",
|
61 |
+
"sep_token": "</s>",
|
62 |
+
"strip_accents": null,
|
63 |
+
"tokenize_chinese_chars": true,
|
64 |
+
"tokenizer_class": "MPNetTokenizer",
|
65 |
+
"unk_token": "[UNK]"
|
66 |
+
}
|
vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|