Skip to content

Commit ee752be

Browse files
authored
Merge pull request #57 from Paulanerus/dev
Dev
2 parents eda4afe + c8db5bd commit ee752be

5 files changed

Lines changed: 17 additions & 5 deletions

File tree

api/src/main/kotlin/dev/paulee/api/internal/Embedding.kt

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -29,6 +29,16 @@ object Embedding {
2929
maxLength = 512,
3030
)
3131
),
32+
AncientGreekVariantSBERT(
33+
"Paulanerus/AncientGreekVariantSBERT-ONNX",
34+
"model_management.ancient_greek_variant_sbert.desc",
35+
"Paulanerus",
36+
"110M",
37+
"https://huggingface.co/Paulanerus/AncientGreekVariantSBERT-ONNX",
38+
ModelData(
39+
maxLength = 512,
40+
)
41+
),
3242
GreekTransfer(
3343
"onnx-community/stsb-xlm-r-greek-transfer-ONNX",
3444
"model_management.greek_transfer.desc",

core/src/main/kotlin/dev/paulee/core/data/provider/EmbeddingProvider.kt

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -122,7 +122,7 @@ internal object EmbeddingProvider {
122122
createRawEmbeddings(model, texts)
123123
}
124124

125-
Embedding.Model.AncientGreekBert -> {
125+
Embedding.Model.AncientGreekBert, Embedding.Model.AncientGreekVariantSBERT -> {
126126
val texts = values.map { it.stripAccentsAndLowercase() }
127127

128128
createRawEmbeddings(model, texts)
@@ -323,7 +323,7 @@ internal object EmbeddingProvider {
323323
fun runSession(sessionInputs: Map<String, OnnxTensor>): Array<FloatArray> {
324324
session.run(sessionInputs).use { result ->
325325
val batch = when (model) {
326-
Embedding.Model.AncientGreekBert, Embedding.Model.GreekTransfer -> {
326+
Embedding.Model.AncientGreekBert, Embedding.Model.GreekTransfer, Embedding.Model.AncientGreekVariantSBERT -> {
327327
val ov = result.get("last_hidden_state")
328328
.orElseThrow { IllegalStateException("No output named last_hidden_state") }
329329

gradle.properties

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ onnx.version=1.22.0
1414
duckdb.version=1.4.1.0
1515
caffeine.version=3.2.2
1616

17-
api.version=1.16.4
18-
core.version=1.18.13
17+
api.version=1.16.5
18+
core.version=1.18.14
1919
ui.version=1.19.5
20-
app.version=1.6.6
20+
app.version=1.6.7

ui/src/main/resources/i18n/strings_de.properties

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -45,6 +45,7 @@ model_management.by=von {0}
4545
model_management.embedding_gemma.desc=Ein schlankes Embedding-Modell basierend auf Gemma 3 und auf über 100 gesprochenen Sprachen trainiert.
4646
model_management.ancient_greek_bert.desc=Ein auf griechische und altgriechische Texte spezialisiertes BERT-Modell.
4747
model_management.greek_transfer.desc=Ein Modell auf Basis von XLM-RoBERTa-base, das mithilfe von Transferlernen auf griechischen und englischen Satzpaaren für semantische Textähnlichkeit trainiert wurde.
48+
model_management.ancient_greek_variant_sbert.desc=Ein Sentence-BERT-Modell, speziell für altgriechische biblische Texte zur semantischen Ähnlichkeitsanalyse, Variantenerkennung und Clustering von Versen und Textabschnitten.
4849

4950
# Data Loader Window
5051

ui/src/main/resources/i18n/strings_en.properties

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -45,6 +45,7 @@ model_management.by=by {0}
4545
model_management.embedding_gemma.desc=A lightweight embedding model based on Gemma 3 and trained on 100+ spoken languages.
4646
model_management.ancient_greek_bert.desc=A BERT model specialized for Greek and Ancient Greek texts.
4747
model_management.greek_transfer.desc=A model based on XLM-RoBERTa-base and trained via transfer learning on Greek and English sentence pairs for semantic textual similarity.
48+
model_management.ancient_greek_variant_sbert.desc=A Sentence-BERT model fine-tuned on Ancient Greek biblical texts for semantic similarity, variant detection, and clustering of verses and passages.
4849

4950
# Data Loader Window
5051

0 commit comments

Comments
 (0)