forked from opentiny/tiny-engine-backend-java
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathEmbeddingMatchDto.java
More file actions
107 lines (89 loc) · 2.94 KB
/
EmbeddingMatchDto.java
File metadata and controls
107 lines (89 loc) · 2.94 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
/**
* Copyright (c) 2023 - present TinyEngine Authors.
* Copyright (c) 2023 - present Huawei Cloud Computing Technologies Co., Ltd.
*
* Use of this source code is governed by an MIT-style license.
*
* THE OPEN SOURCE SOFTWARE IN THIS PRODUCT IS DISTRIBUTED IN THE HOPE THAT IT WILL BE USEFUL,
* BUT WITHOUT ANY WARRANTY, WITHOUT EVEN THE IMPLIED WARRANTY OF MERCHANTABILITY OR FITNESS FOR
* A PARTICULAR PURPOSE. SEE THE APPLICABLE LICENSES FOR MORE DETAILS.
*
*/
package com.tinyengine.it.rag.entity;
import dev.langchain4j.data.segment.TextSegment;
import dev.langchain4j.store.embedding.EmbeddingMatch;
import lombok.Data;
import java.time.LocalDateTime;
import java.util.HashMap;
import java.util.Map;
/**
 * Flattened, transport-friendly view of a single {@link EmbeddingMatch} search hit.
 *
 * <p>Accessors are supplied by Lombok's {@code @Data}; instances are normally built through
 * {@link #from(EmbeddingMatch)}.
 */
@Data
public class EmbeddingMatchDto {
    /** Embedding (vector) id. */
    private String embeddingId;

    /** Creation time; {@link #from(EmbeddingMatch)} fills it with the moment of conversion. */
    private LocalDateTime createTime;

    /** Match score. */
    private Double score;

    /** Document content. */
    private String content;

    /** Metadata. */
    private Map<String, String> metadata;

    /** Collection name. */
    private String collection;

    /** Source. */
    private String source;

    /**
     * Converts an embedding match into a DTO.
     *
     * <p>The id and score are copied from the match and {@code createTime} is set to
     * {@code LocalDateTime.now()}. When the match carries no embedded segment the content is the
     * empty string; otherwise it is the segment text. The metadata map is never {@code null}: it
     * holds whichever of the {@code collection}, {@code documentSetId} and {@code source} entries
     * are present on the segment metadata, and is empty when there is no segment or no metadata.
     * {@code collection} and {@code source} are additionally exposed as dedicated fields.
     *
     * @param match the embedding match to convert; dereferenced without a null check
     * @return a newly populated DTO
     */
    public static EmbeddingMatchDto from(EmbeddingMatch<TextSegment> match) {
        EmbeddingMatchDto result = new EmbeddingMatchDto();
        result.setEmbeddingId(match.embeddingId());
        result.setScore(match.score());
        result.setCreateTime(LocalDateTime.now());

        // One shared map instance: every exit path below leaves the DTO with a non-null map.
        Map<String, String> extracted = new HashMap<>();
        result.setMetadata(extracted);

        TextSegment segment = match.embedded();
        if (segment == null) {
            // No embedded segment: empty content, empty metadata.
            result.setContent("");
            return result;
        }
        result.setContent(segment.text());

        if (segment.metadata() == null) {
            return result;
        }

        // Pull out the commonly used entries.
        String collectionName = segment.metadata().getString("collection");
        String documentSetId = segment.metadata().getString("documentSetId");
        String sourceName = segment.metadata().getString("source");

        result.setCollection(collectionName);
        result.setSource(sourceName);

        // Mirror the same entries into the metadata map, skipping absent ones.
        putIfPresent(extracted, "collection", collectionName);
        putIfPresent(extracted, "documentSetId", documentSetId);
        putIfPresent(extracted, "source", sourceName);
        return result;
    }

    /** Stores {@code value} under {@code key} in {@code target} unless the value is {@code null}. */
    private static void putIfPresent(Map<String, String> target, String key, String value) {
        if (value != null) {
            target.put(key, value);
        }
    }
}